| /* |
| * Copyright (c) 2016, Alliance for Open Media. All rights reserved |
| * |
| * This source code is subject to the terms of the BSD 2 Clause License and |
| * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License |
| * was not distributed with this source code in the LICENSE file, you can |
| * obtain it at www.aomedia.org/license/software. If the Alliance for Open |
| * Media Patent License 1.0 was not distributed with this source code in the |
| * PATENTS file, you can obtain it at www.aomedia.org/license/patent. |
| */ |
| |
| #include <assert.h> |
| #include <math.h> |
| #include <string.h> |
| |
| #include "./aom_scale_rtcd.h" |
| #include "aom/aom_integer.h" |
| #include "av1/common/cdef.h" |
| #include "av1/common/cdef_block.h" |
| #include "av1/common/onyxc_int.h" |
| #include "av1/common/reconinter.h" |
| |
| int sb_all_skip(const AV1_COMMON *const cm, int mi_row, int mi_col) { |
| int r, c; |
| int maxc, maxr; |
| int skip = 1; |
| maxc = cm->mi_cols - mi_col; |
| maxr = cm->mi_rows - mi_row; |
| |
| maxr = AOMMIN(maxr, MI_SIZE_64X64); |
| maxc = AOMMIN(maxc, MI_SIZE_64X64); |
| |
| for (r = 0; r < maxr; r++) { |
| for (c = 0; c < maxc; c++) { |
| skip = skip && |
| cm->mi_grid_visible[(mi_row + r) * cm->mi_stride + mi_col + c] |
| ->mbmi.skip; |
| } |
| } |
| return skip; |
| } |
| |
| static int is_8x8_block_skip(MODE_INFO **grid, int mi_row, int mi_col, |
| int mi_stride) { |
| int is_skip = 1; |
| for (int r = 0; r < mi_size_high[BLOCK_8X8]; ++r) |
| for (int c = 0; c < mi_size_wide[BLOCK_8X8]; ++c) |
| is_skip &= grid[(mi_row + r) * mi_stride + (mi_col + c)]->mbmi.skip; |
| |
| return is_skip; |
| } |
| |
| int sb_compute_cdef_list(const AV1_COMMON *const cm, int mi_row, int mi_col, |
| cdef_list *dlist, int filter_skip) { |
| int r, c; |
| int maxc, maxr; |
| MODE_INFO **grid; |
| int count = 0; |
| grid = cm->mi_grid_visible; |
| maxc = cm->mi_cols - mi_col; |
| maxr = cm->mi_rows - mi_row; |
| |
| maxr = AOMMIN(maxr, MI_SIZE_64X64); |
| maxc = AOMMIN(maxc, MI_SIZE_64X64); |
| |
| const int r_step = mi_size_high[BLOCK_8X8]; |
| const int c_step = mi_size_wide[BLOCK_8X8]; |
| const int r_shift = (r_step == 2); |
| const int c_shift = (c_step == 2); |
| |
| assert(r_step == 1 || r_step == 2); |
| assert(c_step == 1 || c_step == 2); |
| |
| if (filter_skip) { |
| for (r = 0; r < maxr; r += r_step) { |
| for (c = 0; c < maxc; c += c_step) { |
| dlist[count].by = r >> r_shift; |
| dlist[count].bx = c >> c_shift; |
| dlist[count].skip = |
| is_8x8_block_skip(grid, mi_row + r, mi_col + c, cm->mi_stride); |
| count++; |
| } |
| } |
| } else { |
| for (r = 0; r < maxr; r += r_step) { |
| for (c = 0; c < maxc; c += c_step) { |
| if (!is_8x8_block_skip(grid, mi_row + r, mi_col + c, cm->mi_stride)) { |
| dlist[count].by = r >> r_shift; |
| dlist[count].bx = c >> c_shift; |
| dlist[count].skip = 0; |
| count++; |
| } |
| } |
| } |
| } |
| return count; |
| } |
| |
| void copy_rect8_8bit_to_16bit_c(uint16_t *dst, int dstride, const uint8_t *src, |
| int sstride, int v, int h) { |
| int i, j; |
| for (i = 0; i < v; i++) { |
| for (j = 0; j < h; j++) { |
| dst[i * dstride + j] = src[i * sstride + j]; |
| } |
| } |
| } |
| |
| void copy_rect8_16bit_to_16bit_c(uint16_t *dst, int dstride, |
| const uint16_t *src, int sstride, int v, |
| int h) { |
| int i, j; |
| for (i = 0; i < v; i++) { |
| for (j = 0; j < h; j++) { |
| dst[i * dstride + j] = src[i * sstride + j]; |
| } |
| } |
| } |
| |
| static void copy_sb8_16(AOM_UNUSED AV1_COMMON *cm, uint16_t *dst, int dstride, |
| const uint8_t *src, int src_voffset, int src_hoffset, |
| int sstride, int vsize, int hsize) { |
| #if CONFIG_HIGHBITDEPTH |
| if (cm->use_highbitdepth) { |
| const uint16_t *base = |
| &CONVERT_TO_SHORTPTR(src)[src_voffset * sstride + src_hoffset]; |
| copy_rect8_16bit_to_16bit(dst, dstride, base, sstride, vsize, hsize); |
| } else { |
| #endif |
| const uint8_t *base = &src[src_voffset * sstride + src_hoffset]; |
| copy_rect8_8bit_to_16bit(dst, dstride, base, sstride, vsize, hsize); |
| #if CONFIG_HIGHBITDEPTH |
| } |
| #endif |
| } |
| |
| static INLINE void fill_rect(uint16_t *dst, int dstride, int v, int h, |
| uint16_t x) { |
| int i, j; |
| for (i = 0; i < v; i++) { |
| for (j = 0; j < h; j++) { |
| dst[i * dstride + j] = x; |
| } |
| } |
| } |
| |
| static INLINE void copy_rect(uint16_t *dst, int dstride, const uint16_t *src, |
| int sstride, int v, int h) { |
| int i, j; |
| for (i = 0; i < v; i++) { |
| for (j = 0; j < h; j++) { |
| dst[i * dstride + j] = src[i * sstride + j]; |
| } |
| } |
| } |
| |
| void av1_cdef_frame(YV12_BUFFER_CONFIG *frame, AV1_COMMON *cm, |
| MACROBLOCKD *xd) { |
| int fbr, fbc; |
| int nhfb, nvfb; |
| DECLARE_ALIGNED(16, uint16_t, src[CDEF_INBUF_SIZE]); |
| uint16_t *linebuf[3]; |
| uint16_t *colbuf[3]; |
| cdef_list dlist[MI_SIZE_64X64 * MI_SIZE_64X64]; |
| unsigned char *row_cdef, *prev_row_cdef, *curr_row_cdef; |
| int cdef_count; |
| int dir[CDEF_NBLOCKS][CDEF_NBLOCKS] = { { 0 } }; |
| int var[CDEF_NBLOCKS][CDEF_NBLOCKS] = { { 0 } }; |
| int stride; |
| int mi_wide_l2[3]; |
| int mi_high_l2[3]; |
| int xdec[3]; |
| int ydec[3]; |
| int pli; |
| int cdef_left; |
| int coeff_shift = AOMMAX(cm->bit_depth - 8, 0); |
| int nplanes = MAX_MB_PLANE; |
| int chroma_cdef = xd->plane[1].subsampling_x == xd->plane[1].subsampling_y && |
| xd->plane[2].subsampling_x == xd->plane[2].subsampling_y; |
| nvfb = (cm->mi_rows + MI_SIZE_64X64 - 1) / MI_SIZE_64X64; |
| nhfb = (cm->mi_cols + MI_SIZE_64X64 - 1) / MI_SIZE_64X64; |
| av1_setup_dst_planes(xd->plane, cm->sb_size, frame, 0, 0); |
| row_cdef = aom_malloc(sizeof(*row_cdef) * (nhfb + 2) * 2); |
| memset(row_cdef, 1, sizeof(*row_cdef) * (nhfb + 2) * 2); |
| prev_row_cdef = row_cdef + 1; |
| curr_row_cdef = prev_row_cdef + nhfb + 2; |
| for (pli = 0; pli < nplanes; pli++) { |
| xdec[pli] = xd->plane[pli].subsampling_x; |
| ydec[pli] = xd->plane[pli].subsampling_y; |
| mi_wide_l2[pli] = MI_SIZE_LOG2 - xd->plane[pli].subsampling_x; |
| mi_high_l2[pli] = MI_SIZE_LOG2 - xd->plane[pli].subsampling_y; |
| if (xdec[pli] != ydec[pli]) nplanes = 1; |
| } |
| stride = (cm->mi_cols << MI_SIZE_LOG2) + 2 * CDEF_HBORDER; |
| for (pli = 0; pli < nplanes; pli++) { |
| linebuf[pli] = aom_malloc(sizeof(*linebuf) * CDEF_VBORDER * stride); |
| colbuf[pli] = |
| aom_malloc(sizeof(*colbuf) * |
| ((CDEF_BLOCKSIZE << mi_high_l2[pli]) + 2 * CDEF_VBORDER) * |
| CDEF_HBORDER); |
| } |
| for (fbr = 0; fbr < nvfb; fbr++) { |
| for (pli = 0; pli < nplanes; pli++) { |
| const int block_height = |
| (MI_SIZE_64X64 << mi_high_l2[pli]) + 2 * CDEF_VBORDER; |
| fill_rect(colbuf[pli], CDEF_HBORDER, block_height, CDEF_HBORDER, |
| CDEF_VERY_LARGE); |
| } |
| cdef_left = 1; |
| for (fbc = 0; fbc < nhfb; fbc++) { |
| int level, sec_strength; |
| int uv_level, uv_sec_strength; |
| int nhb, nvb; |
| int cstart = 0; |
| curr_row_cdef[fbc] = 0; |
| if (cm->mi_grid_visible[MI_SIZE_64X64 * fbr * cm->mi_stride + |
| MI_SIZE_64X64 * fbc] == NULL || |
| cm->mi_grid_visible[MI_SIZE_64X64 * fbr * cm->mi_stride + |
| MI_SIZE_64X64 * fbc] |
| ->mbmi.cdef_strength == -1) { |
| cdef_left = 0; |
| continue; |
| } |
| if (!cdef_left) cstart = -CDEF_HBORDER; |
| nhb = AOMMIN(MI_SIZE_64X64, cm->mi_cols - MI_SIZE_64X64 * fbc); |
| nvb = AOMMIN(MI_SIZE_64X64, cm->mi_rows - MI_SIZE_64X64 * fbr); |
| int tile_top, tile_left, tile_bottom, tile_right; |
| int mi_idx = MI_SIZE_64X64 * fbr * cm->mi_stride + MI_SIZE_64X64 * fbc; |
| MODE_INFO *const mi_tl = cm->mi + mi_idx; |
| BOUNDARY_TYPE boundary_tl = mi_tl->mbmi.boundary_info; |
| tile_top = boundary_tl & TILE_ABOVE_BOUNDARY; |
| tile_left = boundary_tl & TILE_LEFT_BOUNDARY; |
| |
| if (fbr != nvfb - 1 && |
| (&cm->mi[mi_idx + (MI_SIZE_64X64 - 1) * cm->mi_stride])) |
| tile_bottom = cm->mi[mi_idx + (MI_SIZE_64X64 - 1) * cm->mi_stride] |
| .mbmi.boundary_info & |
| TILE_BOTTOM_BOUNDARY; |
| else |
| tile_bottom = 1; |
| |
| if (fbc != nhfb - 1 && (&cm->mi[mi_idx + MI_SIZE_64X64 - 1])) |
| tile_right = cm->mi[mi_idx + MI_SIZE_64X64 - 1].mbmi.boundary_info & |
| TILE_RIGHT_BOUNDARY; |
| else |
| tile_right = 1; |
| |
| const int mbmi_cdef_strength = |
| cm->mi_grid_visible[MI_SIZE_64X64 * fbr * cm->mi_stride + |
| MI_SIZE_64X64 * fbc] |
| ->mbmi.cdef_strength; |
| level = cm->cdef_strengths[mbmi_cdef_strength] / CDEF_SEC_STRENGTHS; |
| sec_strength = |
| cm->cdef_strengths[mbmi_cdef_strength] % CDEF_SEC_STRENGTHS; |
| sec_strength += sec_strength == 3; |
| uv_level = cm->cdef_uv_strengths[mbmi_cdef_strength] / CDEF_SEC_STRENGTHS; |
| uv_sec_strength = |
| cm->cdef_uv_strengths[mbmi_cdef_strength] % CDEF_SEC_STRENGTHS; |
| uv_sec_strength += uv_sec_strength == 3; |
| if ((level == 0 && sec_strength == 0 && uv_level == 0 && |
| uv_sec_strength == 0) || |
| (cdef_count = sb_compute_cdef_list( |
| cm, fbr * MI_SIZE_64X64, fbc * MI_SIZE_64X64, dlist, |
| #if CONFIG_CDEF_SINGLEPASS |
| (level & 1) || (uv_level & 1))) == 0) |
| #else |
| get_filter_skip(level) || get_filter_skip(uv_level))) == 0) |
| #endif |
| { |
| cdef_left = 0; |
| continue; |
| } |
| |
| curr_row_cdef[fbc] = 1; |
| for (pli = 0; pli < nplanes; pli++) { |
| #if !CONFIG_CDEF_SINGLEPASS |
| DECLARE_ALIGNED(16, uint16_t, dst[CDEF_BLOCKSIZE * CDEF_BLOCKSIZE]); |
| #endif |
| int coffset; |
| int rend, cend; |
| int pri_damping = cm->cdef_pri_damping; |
| int sec_damping = cm->cdef_sec_damping; |
| int hsize = nhb << mi_wide_l2[pli]; |
| int vsize = nvb << mi_high_l2[pli]; |
| |
| if (pli) { |
| if (chroma_cdef) |
| level = uv_level; |
| else |
| level = 0; |
| sec_strength = uv_sec_strength; |
| } |
| |
| if (fbc == nhfb - 1) |
| cend = hsize; |
| else |
| cend = hsize + CDEF_HBORDER; |
| |
| if (fbr == nvfb - 1) |
| rend = vsize; |
| else |
| rend = vsize + CDEF_VBORDER; |
| |
| coffset = fbc * MI_SIZE_64X64 << mi_wide_l2[pli]; |
| if (fbc == nhfb - 1) { |
| /* On the last superblock column, fill in the right border with |
| CDEF_VERY_LARGE to avoid filtering with the outside. */ |
| fill_rect(&src[cend + CDEF_HBORDER], CDEF_BSTRIDE, |
| rend + CDEF_VBORDER, hsize + CDEF_HBORDER - cend, |
| CDEF_VERY_LARGE); |
| } |
| if (fbr == nvfb - 1) { |
| /* On the last superblock row, fill in the bottom border with |
| CDEF_VERY_LARGE to avoid filtering with the outside. */ |
| fill_rect(&src[(rend + CDEF_VBORDER) * CDEF_BSTRIDE], CDEF_BSTRIDE, |
| CDEF_VBORDER, hsize + 2 * CDEF_HBORDER, CDEF_VERY_LARGE); |
| } |
| /* Copy in the pixels we need from the current superblock for |
| deringing.*/ |
| copy_sb8_16(cm, |
| &src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER + cstart], |
| CDEF_BSTRIDE, xd->plane[pli].dst.buf, |
| (MI_SIZE_64X64 << mi_high_l2[pli]) * fbr, coffset + cstart, |
| xd->plane[pli].dst.stride, rend, cend - cstart); |
| if (!prev_row_cdef[fbc]) { |
| copy_sb8_16(cm, &src[CDEF_HBORDER], CDEF_BSTRIDE, |
| xd->plane[pli].dst.buf, |
| (MI_SIZE_64X64 << mi_high_l2[pli]) * fbr - CDEF_VBORDER, |
| coffset, xd->plane[pli].dst.stride, CDEF_VBORDER, hsize); |
| } else if (fbr > 0) { |
| copy_rect(&src[CDEF_HBORDER], CDEF_BSTRIDE, &linebuf[pli][coffset], |
| stride, CDEF_VBORDER, hsize); |
| } else { |
| fill_rect(&src[CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER, hsize, |
| CDEF_VERY_LARGE); |
| } |
| if (!prev_row_cdef[fbc - 1]) { |
| copy_sb8_16(cm, src, CDEF_BSTRIDE, xd->plane[pli].dst.buf, |
| (MI_SIZE_64X64 << mi_high_l2[pli]) * fbr - CDEF_VBORDER, |
| coffset - CDEF_HBORDER, xd->plane[pli].dst.stride, |
| CDEF_VBORDER, CDEF_HBORDER); |
| } else if (fbr > 0 && fbc > 0) { |
| copy_rect(src, CDEF_BSTRIDE, &linebuf[pli][coffset - CDEF_HBORDER], |
| stride, CDEF_VBORDER, CDEF_HBORDER); |
| } else { |
| fill_rect(src, CDEF_BSTRIDE, CDEF_VBORDER, CDEF_HBORDER, |
| CDEF_VERY_LARGE); |
| } |
| if (!prev_row_cdef[fbc + 1]) { |
| copy_sb8_16(cm, &src[CDEF_HBORDER + (nhb << mi_wide_l2[pli])], |
| CDEF_BSTRIDE, xd->plane[pli].dst.buf, |
| (MI_SIZE_64X64 << mi_high_l2[pli]) * fbr - CDEF_VBORDER, |
| coffset + hsize, xd->plane[pli].dst.stride, CDEF_VBORDER, |
| CDEF_HBORDER); |
| } else if (fbr > 0 && fbc < nhfb - 1) { |
| copy_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE, |
| &linebuf[pli][coffset + hsize], stride, CDEF_VBORDER, |
| CDEF_HBORDER); |
| } else { |
| fill_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE, CDEF_VBORDER, |
| CDEF_HBORDER, CDEF_VERY_LARGE); |
| } |
| if (cdef_left) { |
| /* If we deringed the superblock on the left then we need to copy in |
| saved pixels. */ |
| copy_rect(src, CDEF_BSTRIDE, colbuf[pli], CDEF_HBORDER, |
| rend + CDEF_VBORDER, CDEF_HBORDER); |
| } |
| /* Saving pixels in case we need to dering the superblock on the |
| right. */ |
| copy_rect(colbuf[pli], CDEF_HBORDER, src + hsize, CDEF_BSTRIDE, |
| rend + CDEF_VBORDER, CDEF_HBORDER); |
| copy_sb8_16( |
| cm, &linebuf[pli][coffset], stride, xd->plane[pli].dst.buf, |
| (MI_SIZE_64X64 << mi_high_l2[pli]) * (fbr + 1) - CDEF_VBORDER, |
| coffset, xd->plane[pli].dst.stride, CDEF_VBORDER, hsize); |
| |
| if (tile_top) { |
| fill_rect(src, CDEF_BSTRIDE, CDEF_VBORDER, hsize + 2 * CDEF_HBORDER, |
| CDEF_VERY_LARGE); |
| } |
| if (tile_left) { |
| fill_rect(src, CDEF_BSTRIDE, vsize + 2 * CDEF_VBORDER, CDEF_HBORDER, |
| CDEF_VERY_LARGE); |
| } |
| if (tile_bottom) { |
| fill_rect(&src[(vsize + CDEF_VBORDER) * CDEF_BSTRIDE], CDEF_BSTRIDE, |
| CDEF_VBORDER, hsize + 2 * CDEF_HBORDER, CDEF_VERY_LARGE); |
| } |
| if (tile_right) { |
| fill_rect(&src[hsize + CDEF_HBORDER], CDEF_BSTRIDE, |
| vsize + 2 * CDEF_VBORDER, CDEF_HBORDER, CDEF_VERY_LARGE); |
| } |
| #if CONFIG_HIGHBITDEPTH |
| if (cm->use_highbitdepth) { |
| cdef_filter_fb( |
| #if CONFIG_CDEF_SINGLEPASS |
| NULL, |
| &CONVERT_TO_SHORTPTR(xd->plane[pli].dst.buf) |
| #else |
| (uint8_t *)&CONVERT_TO_SHORTPTR(xd->plane[pli].dst.buf) |
| #endif |
| [xd->plane[pli].dst.stride * |
| (MI_SIZE_64X64 * fbr << mi_high_l2[pli]) + |
| (fbc * MI_SIZE_64X64 << mi_wide_l2[pli])], |
| #if CONFIG_CDEF_SINGLEPASS |
| xd->plane[pli].dst.stride, |
| #else |
| xd->plane[pli].dst.stride, dst, |
| #endif |
| &src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER], xdec[pli], |
| ydec[pli], dir, NULL, var, pli, dlist, cdef_count, level, |
| #if CONFIG_CDEF_SINGLEPASS |
| sec_strength, pri_damping, sec_damping, coeff_shift); |
| #else |
| sec_strength, sec_damping, pri_damping, coeff_shift, 0, 1); |
| #endif |
| } else { |
| #endif |
| cdef_filter_fb( |
| &xd->plane[pli] |
| .dst.buf[xd->plane[pli].dst.stride * |
| (MI_SIZE_64X64 * fbr << mi_high_l2[pli]) + |
| (fbc * MI_SIZE_64X64 << mi_wide_l2[pli])], |
| #if CONFIG_CDEF_SINGLEPASS |
| NULL, xd->plane[pli].dst.stride, |
| #else |
| xd->plane[pli].dst.stride, dst, |
| #endif |
| &src[CDEF_VBORDER * CDEF_BSTRIDE + CDEF_HBORDER], xdec[pli], |
| ydec[pli], dir, NULL, var, pli, dlist, cdef_count, level, |
| #if CONFIG_CDEF_SINGLEPASS |
| sec_strength, pri_damping, sec_damping, coeff_shift); |
| #else |
| sec_strength, sec_damping, pri_damping, coeff_shift, 0, 0); |
| #endif |
| |
| #if CONFIG_HIGHBITDEPTH |
| } |
| #endif |
| } |
| cdef_left = 1; |
| } |
| { |
| unsigned char *tmp; |
| tmp = prev_row_cdef; |
| prev_row_cdef = curr_row_cdef; |
| curr_row_cdef = tmp; |
| } |
| } |
| aom_free(row_cdef); |
| for (pli = 0; pli < nplanes; pli++) { |
| aom_free(linebuf[pli]); |
| aom_free(colbuf[pli]); |
| } |
| } |