summaryrefslogtreecommitdiffstats
path: root/third_party/aom/av1/common/cdef.c
diff options
context:
space:
mode:
Diffstat (limited to 'third_party/aom/av1/common/cdef.c')
-rw-r--r--third_party/aom/av1/common/cdef.c445
1 files changed, 445 insertions, 0 deletions
diff --git a/third_party/aom/av1/common/cdef.c b/third_party/aom/av1/common/cdef.c
new file mode 100644
index 000000000..53dff98b7
--- /dev/null
+++ b/third_party/aom/av1/common/cdef.c
@@ -0,0 +1,445 @@
+/*
+ * Copyright (c) 2016, Alliance for Open Media. All rights reserved
+ *
+ * This source code is subject to the terms of the BSD 2 Clause License and
+ * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
+ * was not distributed with this source code in the LICENSE file, you can
+ * obtain it at www.aomedia.org/license/software. If the Alliance for Open
+ * Media Patent License 1.0 was not distributed with this source code in the
+ * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
+ */
+
+#include <assert.h>
+#include <math.h>
+#include <string.h>
+
+#include "./aom_scale_rtcd.h"
+#include "aom/aom_integer.h"
+#include "av1/common/cdef.h"
+#include "av1/common/od_dering.h"
+#include "av1/common/onyxc_int.h"
+#include "av1/common/reconinter.h"
+
+int sb_all_skip(const AV1_COMMON *const cm, int mi_row, int mi_col) {
+ int r, c;
+ int maxc, maxr;
+ int skip = 1;
+ maxc = cm->mi_cols - mi_col;
+ maxr = cm->mi_rows - mi_row;
+#if CONFIG_EXT_PARTITION
+ if (maxr > cm->mib_size_log2) maxr = cm->mib_size_log2;
+ if (maxc > cm->mib_size_log2) maxc = cm->mib_size_log2;
+#else
+ if (maxr > MAX_MIB_SIZE) maxr = MAX_MIB_SIZE;
+ if (maxc > MAX_MIB_SIZE) maxc = MAX_MIB_SIZE;
+#endif
+
+ for (r = 0; r < maxr; r++) {
+ for (c = 0; c < maxc; c++) {
+ skip = skip &&
+ cm->mi_grid_visible[(mi_row + r) * cm->mi_stride + mi_col + c]
+ ->mbmi.skip;
+ }
+ }
+ return skip;
+}
+
+static int is_8x8_block_skip(MODE_INFO **grid, int mi_row, int mi_col,
+ int mi_stride) {
+ int is_skip = 1;
+ for (int r = 0; r < mi_size_high[BLOCK_8X8]; ++r)
+ for (int c = 0; c < mi_size_wide[BLOCK_8X8]; ++c)
+ is_skip &= grid[(mi_row + r) * mi_stride + (mi_col + c)]->mbmi.skip;
+
+ return is_skip;
+}
+
+int sb_compute_dering_list(const AV1_COMMON *const cm, int mi_row, int mi_col,
+ dering_list *dlist, int filter_skip) {
+ int r, c;
+ int maxc, maxr;
+ MODE_INFO **grid;
+ int count = 0;
+ grid = cm->mi_grid_visible;
+ maxc = cm->mi_cols - mi_col;
+ maxr = cm->mi_rows - mi_row;
+#if CONFIG_EXT_PARTITION
+ if (maxr > cm->mib_size_log2) maxr = cm->mib_size_log2;
+ if (maxc > cm->mib_size_log2) maxc = cm->mib_size_log2;
+#else
+ if (maxr > MAX_MIB_SIZE) maxr = MAX_MIB_SIZE;
+ if (maxc > MAX_MIB_SIZE) maxc = MAX_MIB_SIZE;
+#endif
+
+ const int r_step = mi_size_high[BLOCK_8X8];
+ const int c_step = mi_size_wide[BLOCK_8X8];
+ const int r_shift = (r_step == 2);
+ const int c_shift = (c_step == 2);
+
+ assert(r_step == 1 || r_step == 2);
+ assert(c_step == 1 || c_step == 2);
+
+ if (filter_skip) {
+ for (r = 0; r < maxr; r += r_step) {
+ for (c = 0; c < maxc; c += c_step) {
+ dlist[count].by = r >> r_shift;
+ dlist[count].bx = c >> c_shift;
+ dlist[count].skip =
+ is_8x8_block_skip(grid, mi_row + r, mi_col + c, cm->mi_stride);
+ count++;
+ }
+ }
+ } else {
+ for (r = 0; r < maxr; r += r_step) {
+ for (c = 0; c < maxc; c += c_step) {
+ if (!is_8x8_block_skip(grid, mi_row + r, mi_col + c, cm->mi_stride)) {
+ dlist[count].by = r >> r_shift;
+ dlist[count].bx = c >> c_shift;
+ dlist[count].skip = 0;
+ count++;
+ }
+ }
+ }
+ }
+ return count;
+}
+
+void copy_rect8_8bit_to_16bit_c(uint16_t *dst, int dstride, const uint8_t *src,
+ int sstride, int v, int h) {
+ int i, j;
+ for (i = 0; i < v; i++) {
+ for (j = 0; j < h; j++) {
+ dst[i * dstride + j] = src[i * sstride + j];
+ }
+ }
+}
+
+void copy_rect8_16bit_to_16bit_c(uint16_t *dst, int dstride,
+ const uint16_t *src, int sstride, int v,
+ int h) {
+ int i, j;
+ for (i = 0; i < v; i++) {
+ for (j = 0; j < h; j++) {
+ dst[i * dstride + j] = src[i * sstride + j];
+ }
+ }
+}
+
+void copy_sb8_16(UNUSED AV1_COMMON *cm, uint16_t *dst, int dstride,
+ const uint8_t *src, int src_voffset, int src_hoffset,
+ int sstride, int vsize, int hsize) {
+#if CONFIG_HIGHBITDEPTH
+ if (cm->use_highbitdepth) {
+ const uint16_t *base =
+ &CONVERT_TO_SHORTPTR(src)[src_voffset * sstride + src_hoffset];
+ copy_rect8_16bit_to_16bit(dst, dstride, base, sstride, vsize, hsize);
+ } else {
+#endif
+ const uint8_t *base = &src[src_voffset * sstride + src_hoffset];
+ copy_rect8_8bit_to_16bit(dst, dstride, base, sstride, vsize, hsize);
+#if CONFIG_HIGHBITDEPTH
+ }
+#endif
+}
+
+static INLINE void fill_rect(uint16_t *dst, int dstride, int v, int h,
+ uint16_t x) {
+ int i, j;
+ for (i = 0; i < v; i++) {
+ for (j = 0; j < h; j++) {
+ dst[i * dstride + j] = x;
+ }
+ }
+}
+
+static INLINE void copy_rect(uint16_t *dst, int dstride, const uint16_t *src,
+ int sstride, int v, int h) {
+ int i, j;
+ for (i = 0; i < v; i++) {
+ for (j = 0; j < h; j++) {
+ dst[i * dstride + j] = src[i * sstride + j];
+ }
+ }
+}
+
+void av1_cdef_frame(YV12_BUFFER_CONFIG *frame, AV1_COMMON *cm,
+ MACROBLOCKD *xd) {
+ int sbr, sbc;
+ int nhsb, nvsb;
+ uint16_t src[OD_DERING_INBUF_SIZE];
+ uint16_t *linebuf[3];
+ uint16_t *colbuf[3];
+ dering_list dlist[MAX_MIB_SIZE * MAX_MIB_SIZE];
+ unsigned char *row_dering, *prev_row_dering, *curr_row_dering;
+ int dering_count;
+ int dir[OD_DERING_NBLOCKS][OD_DERING_NBLOCKS] = { { 0 } };
+ int var[OD_DERING_NBLOCKS][OD_DERING_NBLOCKS] = { { 0 } };
+ int stride;
+ int mi_wide_l2[3];
+ int mi_high_l2[3];
+ int xdec[3];
+ int ydec[3];
+ int pli;
+ int dering_left;
+ int coeff_shift = AOMMAX(cm->bit_depth - 8, 0);
+ int nplanes = 3;
+ int chroma_dering =
+ xd->plane[1].subsampling_x == xd->plane[1].subsampling_y &&
+ xd->plane[2].subsampling_x == xd->plane[2].subsampling_y;
+ nvsb = (cm->mi_rows + MAX_MIB_SIZE - 1) / MAX_MIB_SIZE;
+ nhsb = (cm->mi_cols + MAX_MIB_SIZE - 1) / MAX_MIB_SIZE;
+ av1_setup_dst_planes(xd->plane, cm->sb_size, frame, 0, 0);
+ row_dering = aom_malloc(sizeof(*row_dering) * (nhsb + 2) * 2);
+ memset(row_dering, 1, sizeof(*row_dering) * (nhsb + 2) * 2);
+ prev_row_dering = row_dering + 1;
+ curr_row_dering = prev_row_dering + nhsb + 2;
+ for (pli = 0; pli < nplanes; pli++) {
+ xdec[pli] = xd->plane[pli].subsampling_x;
+ ydec[pli] = xd->plane[pli].subsampling_y;
+ mi_wide_l2[pli] = MI_SIZE_LOG2 - xd->plane[pli].subsampling_x;
+ mi_high_l2[pli] = MI_SIZE_LOG2 - xd->plane[pli].subsampling_y;
+ }
+ stride = (cm->mi_cols << MI_SIZE_LOG2) + 2 * OD_FILT_HBORDER;
+ for (pli = 0; pli < nplanes; pli++) {
+ linebuf[pli] = aom_malloc(sizeof(*linebuf) * OD_FILT_VBORDER * stride);
+ colbuf[pli] =
+ aom_malloc(sizeof(*colbuf) *
+ ((MAX_SB_SIZE << mi_high_l2[pli]) + 2 * OD_FILT_VBORDER) *
+ OD_FILT_HBORDER);
+ }
+ for (sbr = 0; sbr < nvsb; sbr++) {
+ for (pli = 0; pli < nplanes; pli++) {
+ const int block_height =
+ (MAX_MIB_SIZE << mi_high_l2[pli]) + 2 * OD_FILT_VBORDER;
+ fill_rect(colbuf[pli], OD_FILT_HBORDER, block_height, OD_FILT_HBORDER,
+ OD_DERING_VERY_LARGE);
+ }
+ dering_left = 1;
+ for (sbc = 0; sbc < nhsb; sbc++) {
+ int level, clpf_strength;
+ int uv_level, uv_clpf_strength;
+ int nhb, nvb;
+ int cstart = 0;
+ curr_row_dering[sbc] = 0;
+ if (cm->mi_grid_visible[MAX_MIB_SIZE * sbr * cm->mi_stride +
+ MAX_MIB_SIZE * sbc] == NULL ||
+ cm->mi_grid_visible[MAX_MIB_SIZE * sbr * cm->mi_stride +
+ MAX_MIB_SIZE * sbc]
+ ->mbmi.cdef_strength == -1) {
+ dering_left = 0;
+ continue;
+ }
+ if (!dering_left) cstart = -OD_FILT_HBORDER;
+ nhb = AOMMIN(MAX_MIB_SIZE, cm->mi_cols - MAX_MIB_SIZE * sbc);
+ nvb = AOMMIN(MAX_MIB_SIZE, cm->mi_rows - MAX_MIB_SIZE * sbr);
+ int tile_top, tile_left, tile_bottom, tile_right;
+ int mi_idx = MAX_MIB_SIZE * sbr * cm->mi_stride + MAX_MIB_SIZE * sbc;
+ BOUNDARY_TYPE boundary_tl =
+ cm->mi_grid_visible[MAX_MIB_SIZE * sbr * cm->mi_stride +
+ MAX_MIB_SIZE * sbc]
+ ->mbmi.boundary_info;
+ tile_top = boundary_tl & TILE_ABOVE_BOUNDARY;
+ tile_left = boundary_tl & TILE_LEFT_BOUNDARY;
+ /* Right and bottom information appear unreliable, so we use the top
+ and left flags for the next superblocks. */
+ if (sbr != nvsb - 1 &&
+ cm->mi_grid_visible[mi_idx + MAX_MIB_SIZE * cm->mi_stride])
+ tile_bottom = cm->mi_grid_visible[mi_idx + MAX_MIB_SIZE * cm->mi_stride]
+ ->mbmi.boundary_info &
+ TILE_ABOVE_BOUNDARY;
+ else
+ tile_bottom = 1;
+ if (sbc != nhsb - 1 && cm->mi_grid_visible[mi_idx + MAX_MIB_SIZE])
+ tile_right =
+ cm->mi_grid_visible[mi_idx + MAX_MIB_SIZE]->mbmi.boundary_info &
+ TILE_LEFT_BOUNDARY;
+ else
+ tile_right = 1;
+ const int mbmi_cdef_strength =
+ cm->mi_grid_visible[MAX_MIB_SIZE * sbr * cm->mi_stride +
+ MAX_MIB_SIZE * sbc]
+ ->mbmi.cdef_strength;
+ level = cm->cdef_strengths[mbmi_cdef_strength] / CLPF_STRENGTHS;
+ clpf_strength = cm->cdef_strengths[mbmi_cdef_strength] % CLPF_STRENGTHS;
+ clpf_strength += clpf_strength == 3;
+ uv_level = cm->cdef_uv_strengths[mbmi_cdef_strength] / CLPF_STRENGTHS;
+ uv_clpf_strength =
+ cm->cdef_uv_strengths[mbmi_cdef_strength] % CLPF_STRENGTHS;
+ uv_clpf_strength += uv_clpf_strength == 3;
+ if ((level == 0 && clpf_strength == 0 && uv_level == 0 &&
+ uv_clpf_strength == 0) ||
+ (dering_count = sb_compute_dering_list(
+ cm, sbr * MAX_MIB_SIZE, sbc * MAX_MIB_SIZE, dlist,
+ get_filter_skip(level) || get_filter_skip(uv_level))) == 0) {
+ dering_left = 0;
+ continue;
+ }
+
+ curr_row_dering[sbc] = 1;
+ for (pli = 0; pli < nplanes; pli++) {
+ uint16_t dst[MAX_SB_SIZE * MAX_SB_SIZE];
+ int coffset;
+ int rend, cend;
+ int clpf_damping = cm->cdef_clpf_damping;
+ int dering_damping = cm->cdef_dering_damping;
+ int hsize = nhb << mi_wide_l2[pli];
+ int vsize = nvb << mi_high_l2[pli];
+
+ if (pli) {
+ if (chroma_dering)
+ level = uv_level;
+ else
+ level = 0;
+ clpf_strength = uv_clpf_strength;
+ }
+
+ if (sbc == nhsb - 1)
+ cend = hsize;
+ else
+ cend = hsize + OD_FILT_HBORDER;
+
+ if (sbr == nvsb - 1)
+ rend = vsize;
+ else
+ rend = vsize + OD_FILT_VBORDER;
+
+ coffset = sbc * MAX_MIB_SIZE << mi_wide_l2[pli];
+ if (sbc == nhsb - 1) {
+ /* On the last superblock column, fill in the right border with
+ OD_DERING_VERY_LARGE to avoid filtering with the outside. */
+ fill_rect(&src[cend + OD_FILT_HBORDER], OD_FILT_BSTRIDE,
+ rend + OD_FILT_VBORDER, hsize + OD_FILT_HBORDER - cend,
+ OD_DERING_VERY_LARGE);
+ }
+ if (sbr == nvsb - 1) {
+ /* On the last superblock row, fill in the bottom border with
+ OD_DERING_VERY_LARGE to avoid filtering with the outside. */
+ fill_rect(&src[(rend + OD_FILT_VBORDER) * OD_FILT_BSTRIDE],
+ OD_FILT_BSTRIDE, OD_FILT_VBORDER,
+ hsize + 2 * OD_FILT_HBORDER, OD_DERING_VERY_LARGE);
+ }
+ /* Copy in the pixels we need from the current superblock for
+ deringing.*/
+ copy_sb8_16(
+ cm,
+ &src[OD_FILT_VBORDER * OD_FILT_BSTRIDE + OD_FILT_HBORDER + cstart],
+ OD_FILT_BSTRIDE, xd->plane[pli].dst.buf,
+ (MAX_MIB_SIZE << mi_high_l2[pli]) * sbr, coffset + cstart,
+ xd->plane[pli].dst.stride, rend, cend - cstart);
+ if (!prev_row_dering[sbc]) {
+ copy_sb8_16(cm, &src[OD_FILT_HBORDER], OD_FILT_BSTRIDE,
+ xd->plane[pli].dst.buf,
+ (MAX_MIB_SIZE << mi_high_l2[pli]) * sbr - OD_FILT_VBORDER,
+ coffset, xd->plane[pli].dst.stride, OD_FILT_VBORDER,
+ hsize);
+ } else if (sbr > 0) {
+ copy_rect(&src[OD_FILT_HBORDER], OD_FILT_BSTRIDE,
+ &linebuf[pli][coffset], stride, OD_FILT_VBORDER, hsize);
+ } else {
+ fill_rect(&src[OD_FILT_HBORDER], OD_FILT_BSTRIDE, OD_FILT_VBORDER,
+ hsize, OD_DERING_VERY_LARGE);
+ }
+ if (!prev_row_dering[sbc - 1]) {
+ copy_sb8_16(cm, src, OD_FILT_BSTRIDE, xd->plane[pli].dst.buf,
+ (MAX_MIB_SIZE << mi_high_l2[pli]) * sbr - OD_FILT_VBORDER,
+ coffset - OD_FILT_HBORDER, xd->plane[pli].dst.stride,
+ OD_FILT_VBORDER, OD_FILT_HBORDER);
+ } else if (sbr > 0 && sbc > 0) {
+ copy_rect(src, OD_FILT_BSTRIDE,
+ &linebuf[pli][coffset - OD_FILT_HBORDER], stride,
+ OD_FILT_VBORDER, OD_FILT_HBORDER);
+ } else {
+ fill_rect(src, OD_FILT_BSTRIDE, OD_FILT_VBORDER, OD_FILT_HBORDER,
+ OD_DERING_VERY_LARGE);
+ }
+ if (!prev_row_dering[sbc + 1]) {
+ copy_sb8_16(cm, &src[OD_FILT_HBORDER + (nhb << mi_wide_l2[pli])],
+ OD_FILT_BSTRIDE, xd->plane[pli].dst.buf,
+ (MAX_MIB_SIZE << mi_high_l2[pli]) * sbr - OD_FILT_VBORDER,
+ coffset + hsize, xd->plane[pli].dst.stride,
+ OD_FILT_VBORDER, OD_FILT_HBORDER);
+ } else if (sbr > 0 && sbc < nhsb - 1) {
+ copy_rect(&src[hsize + OD_FILT_HBORDER], OD_FILT_BSTRIDE,
+ &linebuf[pli][coffset + hsize], stride, OD_FILT_VBORDER,
+ OD_FILT_HBORDER);
+ } else {
+ fill_rect(&src[hsize + OD_FILT_HBORDER], OD_FILT_BSTRIDE,
+ OD_FILT_VBORDER, OD_FILT_HBORDER, OD_DERING_VERY_LARGE);
+ }
+ if (dering_left) {
+ /* If we deringed the superblock on the left then we need to copy in
+ saved pixels. */
+ copy_rect(src, OD_FILT_BSTRIDE, colbuf[pli], OD_FILT_HBORDER,
+ rend + OD_FILT_VBORDER, OD_FILT_HBORDER);
+ }
+ /* Saving pixels in case we need to dering the superblock on the
+ right. */
+ copy_rect(colbuf[pli], OD_FILT_HBORDER, src + hsize, OD_FILT_BSTRIDE,
+ rend + OD_FILT_VBORDER, OD_FILT_HBORDER);
+ copy_sb8_16(
+ cm, &linebuf[pli][coffset], stride, xd->plane[pli].dst.buf,
+ (MAX_MIB_SIZE << mi_high_l2[pli]) * (sbr + 1) - OD_FILT_VBORDER,
+ coffset, xd->plane[pli].dst.stride, OD_FILT_VBORDER, hsize);
+
+ if (tile_top) {
+ fill_rect(src, OD_FILT_BSTRIDE, OD_FILT_VBORDER,
+ hsize + 2 * OD_FILT_HBORDER, OD_DERING_VERY_LARGE);
+ }
+ if (tile_left) {
+ fill_rect(src, OD_FILT_BSTRIDE, vsize + 2 * OD_FILT_VBORDER,
+ OD_FILT_HBORDER, OD_DERING_VERY_LARGE);
+ }
+ if (tile_bottom) {
+ fill_rect(&src[(vsize + OD_FILT_VBORDER) * OD_FILT_BSTRIDE],
+ OD_FILT_BSTRIDE, OD_FILT_VBORDER,
+ hsize + 2 * OD_FILT_HBORDER, OD_DERING_VERY_LARGE);
+ }
+ if (tile_right) {
+ fill_rect(&src[hsize + OD_FILT_HBORDER], OD_FILT_BSTRIDE,
+ vsize + 2 * OD_FILT_VBORDER, OD_FILT_HBORDER,
+ OD_DERING_VERY_LARGE);
+ }
+#if CONFIG_HIGHBITDEPTH
+ if (cm->use_highbitdepth) {
+ od_dering(
+ (uint8_t *)&CONVERT_TO_SHORTPTR(
+ xd->plane[pli]
+ .dst.buf)[xd->plane[pli].dst.stride *
+ (MAX_MIB_SIZE * sbr << mi_high_l2[pli]) +
+ (sbc * MAX_MIB_SIZE << mi_wide_l2[pli])],
+ xd->plane[pli].dst.stride, dst,
+ &src[OD_FILT_VBORDER * OD_FILT_BSTRIDE + OD_FILT_HBORDER],
+ xdec[pli], ydec[pli], dir, NULL, var, pli, dlist, dering_count,
+ level, clpf_strength, clpf_damping, dering_damping, coeff_shift,
+ 0, 1);
+ } else {
+#endif
+ od_dering(&xd->plane[pli]
+ .dst.buf[xd->plane[pli].dst.stride *
+ (MAX_MIB_SIZE * sbr << mi_high_l2[pli]) +
+ (sbc * MAX_MIB_SIZE << mi_wide_l2[pli])],
+ xd->plane[pli].dst.stride, dst,
+ &src[OD_FILT_VBORDER * OD_FILT_BSTRIDE + OD_FILT_HBORDER],
+ xdec[pli], ydec[pli], dir, NULL, var, pli, dlist,
+ dering_count, level, clpf_strength, clpf_damping,
+ dering_damping, coeff_shift, 0, 0);
+
+#if CONFIG_HIGHBITDEPTH
+ }
+#endif
+ }
+ dering_left = 1;
+ }
+ {
+ unsigned char *tmp;
+ tmp = prev_row_dering;
+ prev_row_dering = curr_row_dering;
+ curr_row_dering = tmp;
+ }
+ }
+ aom_free(row_dering);
+ for (pli = 0; pli < nplanes; pli++) {
+ aom_free(linebuf[pli]);
+ aom_free(colbuf[pli]);
+ }
+}