blob: e00251619f99d8e3838d3a2b725f5d835dcad2f6 [file] [log] [blame]
/*
* Copyright (c) 2016, Alliance for Open Media. All rights reserved
*
* This source code is subject to the terms of the BSD 2 Clause License and
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
* was not distributed with this source code in the LICENSE file, you can
* obtain it at www.aomedia.org/license/software. If the Alliance for Open
* Media Patent License 1.0 was not distributed with this source code in the
* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
*/
#ifndef AOM_AV1_COMMON_CONVOLVE_H_
#define AOM_AV1_COMMON_CONVOLVE_H_
#include <stdbool.h>
#include "av1/common/filter.h"
#ifdef __cplusplus
extern "C" {
#endif
// Element type (16-bit unsigned) of the buffer pointed to by the dst member
// of ConvolveParams.
typedef uint16_t CONV_BUF_TYPE;
// Parameter bundle handed to the convolve functions (see aom_convolve_fn_t
// and aom_highbd_convolve_fn_t). The get_conv_params*() helpers in this
// header build instances of it.
typedef struct ConvolveParams {
// Averaging flag. get_conv_params_no_round() asserts that it is only nonzero
// when is_compound is nonzero.
int do_average;
// Filter precision in bits: FILTER_BITS for get_conv_params_no_round(), the
// caller-supplied value for the Wiener helpers.
int filter_bits;
// Buffer of CONV_BUF_TYPE elements and its stride. The Wiener helpers and
// get_conv_params() set these to NULL / 0.
CONV_BUF_TYPE *dst;
int dst_stride;
// Rounding amounts in bits. As set up by the helpers in this header,
// round_0 + round_1 == 2 * filter_bits whenever is_compound is 0.
// NOTE(review): presumably the shifts applied after the first and second
// filtering pass respectively -- confirm against the convolve kernels.
int round_0;
int round_1;
// Plane index; the Wiener helpers always store 0.
int plane;
// Nonzero selects COMPOUND_ROUND1_BITS for round_1 in
// get_conv_params_no_round().
int is_compound;
// NOTE(review): the next three members look like the switch and the
// forward/backward weights for distance-weighted compound averaging; their
// exact meaning is not visible in this header -- confirm against the users.
int use_dist_wtd_comp_avg;
int fwd_offset;
int bck_offset;
} ConvolveParams;
// Constants used with NonsepFilterConfig.
// NOTE(review): the two *_MAX values look like upper bounds on the number of
// filter taps and filter coefficients -- confirm against the code that sizes
// buffers with them.
#define NONSEP_PIXELS_MAX 32
#define NONSEP_COEFFS_MAX 32
// NOTE(review): presumably the column indices into one 3-int row of
// NonsepFilterConfig.config / config2 (row offset, column offset, position in
// the coefficient buffer) -- confirm against the convolve implementation.
#define NONSEP_ROW_ID 0
#define NONSEP_COL_ID 1
#define NONSEP_BUF_POS 2
// Pass-through "clip": hands x back unchanged. bit_depth is accepted for
// interface purposes only and is never consulted.
static INLINE int16_t clip_base(int16_t x, int bit_depth) {
  const int16_t unchanged = x;
  (void)bit_depth;  // Intentionally unused.
  return unchanged;
}
// Description of a non-separable filter, passed to the av1_convolve_nonsep*()
// functions declared below.
// NOTE(review): the member semantics below are inferred from names and types
// only; the code that consumes them is not part of this header -- confirm.
typedef struct NonsepFilterConfig {
// Presumably the fixed-point precision (in bits) of the filter coefficients.
int prec_bits;
// Presumably the number of rows in config and config2 respectively.
int num_pixels;
int num_pixels2;
// Pointers to tables whose rows hold three ints each (see NONSEP_ROW_ID,
// NONSEP_COL_ID and NONSEP_BUF_POS). config2 presumably describes the second
// input plane used by the *_dual functions.
const int (*config)[3];
const int (*config2)[3];
// Presumably a flag controlling how accesses near the picture boundary are
// handled.
int strict_bounds;
} NonsepFilterConfig;
// Nonseparable convolution.
// dgd (with stride `stride`) is the read-only input, dst (with stride
// `dst_stride`) is the writable output, and filter points to the int16_t
// coefficients used together with the layout in config.
// NOTE(review): width and height are presumably the size in pixels of the
// region to filter -- confirm against the definition.
void av1_convolve_nonsep(const uint8_t *dgd, int width, int height, int stride,
const NonsepFilterConfig *config,
const int16_t *filter, uint8_t *dst, int dst_stride);
// Variant of av1_convolve_nonsep() that additionally takes bit_depth.
// NOTE(review): dgd and dst are declared as uint8_t pointers here, whereas
// av1_convolve_nonsep_cls_highbd() takes uint16_t pointers; presumably these
// are 16-bit buffers passed through a pointer conversion -- confirm against
// the definition.
void av1_convolve_nonsep_highbd(const uint8_t *dgd, int width, int height,
int stride, const NonsepFilterConfig *config,
const int16_t *filter, uint8_t *dst,
int dst_stride, int bit_depth);
// Variant of av1_convolve_nonsep() that additionally takes a read-only
// skip_mask with its own stride (mask_stride).
// NOTE(review): presumably a nonzero mask entry means the corresponding
// position is left unfiltered -- confirm against the definition.
void av1_convolve_nonsep_mask(const uint8_t *dgd, int width, int height,
int stride, const NonsepFilterConfig *config,
const int16_t *filter, uint8_t *dst,
int dst_stride, const uint8_t *skip_mask,
int mask_stride);
// Variant of av1_convolve_nonsep_mask() that additionally takes bit_depth.
// NOTE(review): as with av1_convolve_nonsep_highbd(), dgd and dst are
// declared as uint8_t pointers; presumably converted 16-bit buffers --
// confirm against the definition.
void av1_convolve_nonsep_mask_highbd(const uint8_t *dgd, int width, int height,
int stride,
const NonsepFilterConfig *config,
const int16_t *filter, uint8_t *dst,
int dst_stride, int bit_depth,
const uint8_t *skip_mask, int mask_stride);
// Nonseparable convolution with dual input planes - used for cross component
// filtering.
// Takes two read-only inputs, dgd (stride `stride`) and dgd2 (stride
// `stride2`), and one writable output dst (stride `dst_stride`).
// NOTE(review): presumably config->config / num_pixels apply to dgd and
// config->config2 / num_pixels2 to dgd2 -- confirm against the definition.
void av1_convolve_nonsep_dual(const uint8_t *dgd, int width, int height,
int stride, const uint8_t *dgd2, int stride2,
const NonsepFilterConfig *config,
const int16_t *filter, uint8_t *dst,
int dst_stride);
// Variant of av1_convolve_nonsep_dual() that additionally takes bit_depth.
// NOTE(review): dgd, dgd2 and dst are declared as uint8_t pointers;
// presumably converted 16-bit buffers -- confirm against the definition.
void av1_convolve_nonsep_dual_highbd(const uint8_t *dgd, int width, int height,
int stride, const uint8_t *dgd2,
int stride2,
const NonsepFilterConfig *config,
const int16_t *filter, uint8_t *dst,
int dst_stride, int bit_depth);
// Variant of av1_convolve_nonsep_dual() that additionally takes a read-only
// skip_mask with its own stride (mask_stride).
// NOTE(review): presumably a nonzero mask entry means the corresponding
// position is left unfiltered -- confirm against the definition.
void av1_convolve_nonsep_dual_mask(const uint8_t *dgd, int width, int height,
int stride, const uint8_t *dgd2, int stride2,
const NonsepFilterConfig *config,
const int16_t *filter, uint8_t *dst,
int dst_stride, const uint8_t *skip_mask,
int mask_stride);
// Variant of av1_convolve_nonsep_dual_mask() that additionally takes
// bit_depth.
// NOTE(review): dgd, dgd2 and dst are declared as uint8_t pointers;
// presumably converted 16-bit buffers -- confirm against the definition.
void av1_convolve_nonsep_dual_mask_highbd(
const uint8_t *dgd, int width, int height, int stride, const uint8_t *dgd2,
int stride2, const NonsepFilterConfig *config, const int16_t *filter,
uint8_t *dst, int dst_stride, int bit_depth, const uint8_t *skip_mask,
int mask_stride);
#if CONFIG_SUPERRES_TX64
// Nonseparable classified convolution with different filters used for each
// pixel based on its class as specified by supplied class map.
// cls (stride `cls_stride`) is the read-only class map and filter (stride
// `filter_stride`) holds the int16_t coefficients.
// NOTE(review): presumably filter_stride is the distance, in coefficients,
// between the filters of consecutive classes -- confirm against the
// definition.
void av1_convolve_nonsep_cls(const uint8_t *dgd, int width, int height,
int stride, const NonsepFilterConfig *nsfilter,
const uint8_t *cls, int cls_stride,
const int16_t *filter, int filter_stride,
uint8_t *dst, int dst_stride);
// Variant of av1_convolve_nonsep_cls() operating on uint16_t input (dgd) and
// output (dst) buffers, with an additional bit_depth argument. Unlike the
// other *_highbd declarations in this header, the 16-bit element type is
// spelled out in the signature.
void av1_convolve_nonsep_cls_highbd(const uint16_t *dgd, int width, int height,
int stride,
const NonsepFilterConfig *nsfilter,
const uint8_t *cls, int cls_stride,
const int16_t *filter, int filter_stride,
uint16_t *dst, int dst_stride,
int bit_depth);
#endif // CONFIG_SUPERRES_TX64
// Initial round_0 used by get_conv_params_no_round().
#define ROUND0_BITS 3
// round_1 used by get_conv_params_no_round() when is_compound is nonzero.
#define COMPOUND_ROUND1_BITS 7
// Base round_0 used by the Wiener parameter helpers.
#define WIENER_ROUND0_BITS 3
// Evaluates to 2^(bd + 1 + fb - r0), where fb is the filter precision in
// bits, r0 the first rounding amount and bd the bit depth.
// NOTE(review): presumably the clamp bound for the intermediate Wiener
// filter values -- confirm against the Wiener convolve implementation.
#define WIENER_CLAMP_LIMIT(fb, r0, bd) (1 << ((bd) + 1 + (fb) - (r0)))
// Pointer type for convolve functions working on uint8_t buffers.
// Arguments: read-only source and its stride, writable destination and its
// stride, block width w and height h, the horizontal and vertical
// InterpFilterParams, the two sub-pixel positions, and the ConvolveParams.
// NOTE(review): the unit of subpel_x_qn / subpel_y_qn is not visible in this
// header -- confirm against the implementations.
typedef void (*aom_convolve_fn_t)(const uint8_t *src, int src_stride,
uint8_t *dst, int dst_stride, int w, int h,
const InterpFilterParams *filter_params_x,
const InterpFilterParams *filter_params_y,
const int subpel_x_qn, const int subpel_y_qn,
ConvolveParams *conv_params);
// Pointer type for convolve functions working on uint16_t buffers. Same
// argument list as aom_convolve_fn_t, with uint16_t source/destination and a
// trailing bit depth (bd).
typedef void (*aom_highbd_convolve_fn_t)(
const uint16_t *src, int src_stride, uint16_t *dst, int dst_stride, int w,
int h, const InterpFilterParams *filter_params_x,
const InterpFilterParams *filter_params_y, const int subpel_x_qn,
const int subpel_y_qn, ConvolveParams *conv_params, int bd);
// Forward declarations of struct types that are defined elsewhere.
struct AV1Common;
struct scale_factors;
// Entry point for 2D convolution on uint8_t buffers.
// Takes the source/destination buffers with strides, the block size (w, h),
// orig_w / orig_h, the interpolation filter pair, sub-pixel positions and
// steps for x and y, a `scaled` flag, the ConvolveParams and an `is_intrabc`
// flag.
// NOTE(review): presumably dispatches to a specific convolve kernel based on
// these arguments; the selection logic is in the definition, not in this
// header -- confirm there.
void av1_convolve_2d_facade(const uint8_t *src, int src_stride, uint8_t *dst,
int dst_stride, int w, int h, int orig_w,
int orig_h, int_interpfilters interp_filters,
const int subpel_x_qn, int x_step_q4,
const int subpel_y_qn, int y_step_q4, int scaled,
ConvolveParams *conv_params, int is_intrabc);
// Builds the ConvolveParams for a regular (non-Wiener) convolution.
//
//   do_average       stored as-is; must be 0 unless is_compound is nonzero
//                    (asserted).
//   plane            stored as-is.
//   dst, dst_stride  stored as-is.
//   is_compound      stored as-is; nonzero selects COMPOUND_ROUND1_BITS for
//                    round_1, otherwise round_1 = 2 * FILTER_BITS - round_0.
//   bd               bit depth, used only to compute intbufrange below.
//
// round_0 starts at ROUND0_BITS. If bd + FILTER_BITS - round_0 + 2 exceeds
// 16, round_0 is raised by the excess and, in the non-compound case, round_1
// is lowered by the same amount so that their sum stays 2 * FILTER_BITS.
//
// use_dist_wtd_comp_avg, fwd_offset and bck_offset have no corresponding
// argument; they are set to 0 so that no member of the returned struct is
// left indeterminate. Callers that need other values overwrite them.
static INLINE ConvolveParams get_conv_params_no_round(int do_average, int plane,
                                                      CONV_BUF_TYPE *dst,
                                                      int dst_stride,
                                                      int is_compound, int bd) {
  ConvolveParams conv_params;
  assert(IMPLIES(do_average, is_compound));
  conv_params.do_average = do_average;
  conv_params.filter_bits = FILTER_BITS;
  conv_params.is_compound = is_compound;
  conv_params.round_0 = ROUND0_BITS;
  conv_params.round_1 = is_compound ? COMPOUND_ROUND1_BITS
                                    : 2 * FILTER_BITS - conv_params.round_0;
  const int intbufrange = bd + FILTER_BITS - conv_params.round_0 + 2;
  assert(IMPLIES(bd < 12, intbufrange <= 16));
  if (intbufrange > 16) {
    // Move the excess bits from the second rounding stage to the first.
    conv_params.round_0 += intbufrange - 16;
    if (!is_compound) conv_params.round_1 -= intbufrange - 16;
  }
  // TODO(yunqing): The following dst should only be valid while
  // is_compound = 1;
  conv_params.dst = dst;
  conv_params.dst_stride = dst_stride;
  conv_params.plane = plane;
  // Defined defaults for the members this helper has no input for.
  conv_params.use_dist_wtd_comp_avg = 0;
  conv_params.fwd_offset = 0;
  conv_params.bck_offset = 0;
  return conv_params;
}
// Convenience wrapper around get_conv_params_no_round() for the case with no
// destination buffer (NULL, stride 0) and is_compound == 0.
static INLINE ConvolveParams get_conv_params(int do_average, int plane,
                                             int bd) {
  CONV_BUF_TYPE *const no_dst = NULL;
  const int no_dst_stride = 0;
  const int not_compound = 0;
  return get_conv_params_no_round(do_average, plane, no_dst, no_dst_stride,
                                  not_compound, bd);
}
// Builds the ConvolveParams for Wiener filtering.
//
//   bd           bit depth, used only to compute intbufrange below.
//   filter_bits  filter precision in bits; stored as-is.
//
// round_0 starts at WIENER_ROUND0_BITS and round_1 at
// 2 * filter_bits - round_0. If bd + filter_bits - round_0 + 2 exceeds 16,
// the excess is moved from round_1 to round_0, keeping their sum at
// 2 * filter_bits.
//
// All remaining members are set to 0 / NULL, so no member of the returned
// struct is left indeterminate.
static INLINE ConvolveParams get_conv_params_wiener(int bd, int filter_bits) {
  ConvolveParams conv_params;
  conv_params.filter_bits = filter_bits;
  conv_params.do_average = 0;
  conv_params.is_compound = 0;
  conv_params.round_0 = WIENER_ROUND0_BITS;
  conv_params.round_1 = 2 * filter_bits - conv_params.round_0;
  const int intbufrange = bd + filter_bits - conv_params.round_0 + 2;
  assert(IMPLIES(bd < 12, intbufrange <= 16));
  if (intbufrange > 16) {
    // Move the excess bits from the second rounding stage to the first.
    conv_params.round_0 += intbufrange - 16;
    conv_params.round_1 -= intbufrange - 16;
  }
  conv_params.dst = NULL;
  conv_params.dst_stride = 0;
  conv_params.plane = 0;
  // Defined defaults for the compound-only members.
  conv_params.use_dist_wtd_comp_avg = 0;
  conv_params.fwd_offset = 0;
  conv_params.bck_offset = 0;
  return conv_params;
}
#if CONFIG_WIENER_SEP_HIPREC
// Builds the ConvolveParams for Wiener filtering, with round_0 scaled by the
// filter precision.
//
//   bd           bit depth, used only to compute intbufrange below.
//   filter_bits  filter precision in bits; stored as-is.
//
// round_0 starts at WIENER_ROUND0_BITS + (filter_bits - FILTER_BITS) and
// round_1 at 2 * filter_bits - round_0. If bd + filter_bits - round_0 + 2
// exceeds 16, the excess is moved from round_1 to round_0, keeping their sum
// at 2 * filter_bits.
//
// All remaining members are set to 0 / NULL, so no member of the returned
// struct is left indeterminate.
static INLINE ConvolveParams get_conv_params_wiener_hp(int bd,
                                                       int filter_bits) {
  ConvolveParams conv_params;
  conv_params.filter_bits = filter_bits;
  conv_params.do_average = 0;
  conv_params.is_compound = 0;
  conv_params.round_0 = WIENER_ROUND0_BITS + filter_bits - FILTER_BITS;
  conv_params.round_1 = 2 * filter_bits - conv_params.round_0;
  const int intbufrange = bd + filter_bits - conv_params.round_0 + 2;
  assert(IMPLIES(bd < 12, intbufrange <= 16));
  if (intbufrange > 16) {
    // Move the excess bits from the second rounding stage to the first.
    conv_params.round_0 += intbufrange - 16;
    conv_params.round_1 -= intbufrange - 16;
  }
  conv_params.dst = NULL;
  conv_params.dst_stride = 0;
  conv_params.plane = 0;
  // Defined defaults for the compound-only members.
  conv_params.use_dist_wtd_comp_avg = 0;
  conv_params.fwd_offset = 0;
  conv_params.bck_offset = 0;
  return conv_params;
}
#endif // CONFIG_WIENER_SEP_HIPREC
// Counterpart of av1_convolve_2d_facade() that additionally takes the bit
// depth (bd).
// NOTE(review): the source is named src8 and both buffers are declared as
// uint8_t pointers; presumably they are 16-bit buffers passed through a
// pointer conversion -- confirm against the definition.
void av1_highbd_convolve_2d_facade(
const uint8_t *src8, int src_stride, uint8_t *dst, int dst_stride, int w,
int h, int orig_w, int orig_h, int_interpfilters interp_filters,
const int subpel_x_qn, int x_step_q4, const int subpel_y_qn, int y_step_q4,
int scaled, ConvolveParams *conv_params, int is_intrabc, int bd);
// Reads a w x h block of uint8_t samples from src and writes double-precision
// results to dst.
// NOTE(review): judging by the name this applies a Sobel filter; `dir` and
// `norm` presumably select the filter direction and a scale factor -- confirm
// against the definition.
// TODO(sarahparker): This will need to be integerized and optimized.
void av1_convolve_2d_sobel_y_c(const uint8_t *src, int src_stride, double *dst,
int dst_stride, int w, int h, int dir,
double norm);
#ifdef __cplusplus
} // extern "C"
#endif
#endif // AOM_AV1_COMMON_CONVOLVE_H_