blob: c3d794ed8a111a504a7fe17c57bdfb59db8dda34 [file] [log] [blame]
/*
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
 *
 * This source code is subject to the terms of the BSD 2 Clause License and
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
 * was not distributed with this source code in the LICENSE file, you can
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
 * Media Patent License 1.0 was not distributed with this source code in the
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
 */
11
Yaowu Xuf883b422016-08-30 14:01:10 -070012#ifndef AOM_DSP_INV_TXFM_H_
13#define AOM_DSP_INV_TXFM_H_
Yaowu Xuc27fc142016-08-22 16:08:15 -070014
15#include <assert.h>
16
Yaowu Xuf883b422016-08-30 14:01:10 -070017#include "./aom_config.h"
Yaowu Xuc27fc142016-08-22 16:08:15 -070018#include "aom_dsp/txfm_common.h"
19#include "aom_ports/mem.h"
20
21#ifdef __cplusplus
22extern "C" {
23#endif
24
25static INLINE tran_high_t check_range(tran_high_t input) {
26#if CONFIG_COEFFICIENT_RANGE_CHECKING
Yaowu Xuf883b422016-08-30 14:01:10 -070027 // For valid AV1 input streams, intermediate stage coefficients should always
Yaowu Xuc27fc142016-08-22 16:08:15 -070028 // stay within the range of a signed 16 bit integer. Coefficients can go out
Yaowu Xuf883b422016-08-30 14:01:10 -070029 // of this range for invalid/corrupt AV1 streams. However, strictly checking
Yaowu Xuc27fc142016-08-22 16:08:15 -070030 // this range for every intermediate coefficient can burdensome for a decoder,
31 // therefore the following assertion is only enabled when configured with
32 // --enable-coefficient-range-checking.
33 assert(INT16_MIN <= input);
34 assert(input <= INT16_MAX);
35#endif // CONFIG_COEFFICIENT_RANGE_CHECKING
36 return input;
37}
38
39static INLINE tran_high_t dct_const_round_shift(tran_high_t input) {
40 tran_high_t rv = ROUND_POWER_OF_TWO(input, DCT_CONST_BITS);
41 return rv;
42}
43
Yaowu Xuf883b422016-08-30 14:01:10 -070044#if CONFIG_AOM_HIGHBITDEPTH
Yaowu Xuc27fc142016-08-22 16:08:15 -070045static INLINE tran_high_t highbd_check_range(tran_high_t input, int bd) {
46#if CONFIG_COEFFICIENT_RANGE_CHECKING
Yaowu Xuf883b422016-08-30 14:01:10 -070047 // For valid highbitdepth AV1 streams, intermediate stage coefficients will
Yaowu Xuc27fc142016-08-22 16:08:15 -070048 // stay within the ranges:
49 // - 8 bit: signed 16 bit integer
50 // - 10 bit: signed 18 bit integer
51 // - 12 bit: signed 20 bit integer
52 const int32_t int_max = (1 << (7 + bd)) - 1;
53 const int32_t int_min = -int_max - 1;
54 assert(int_min <= input);
55 assert(input <= int_max);
56 (void)int_min;
57#endif // CONFIG_COEFFICIENT_RANGE_CHECKING
58 (void)bd;
59 return input;
60}
61
62static INLINE tran_high_t highbd_dct_const_round_shift(tran_high_t input) {
63 tran_high_t rv = ROUND_POWER_OF_TWO(input, DCT_CONST_BITS);
64 return rv;
65}
Yaowu Xuf883b422016-08-30 14:01:10 -070066#endif // CONFIG_AOM_HIGHBITDEPTH
Yaowu Xuc27fc142016-08-22 16:08:15 -070067
#if CONFIG_EMULATE_HARDWARE
// When CONFIG_EMULATE_HARDWARE is 1 the transform performs a
// non-normative method to handle overflows. A stream that causes
// overflows in the inverse transform is considered invalid,
// and a hardware implementer is free to choose any reasonable
// method to handle overflows. However, to aid in hardware
// verification they can use a specific implementation of the
// WRAPLOW() macro below that is identical to their intended
// hardware implementation (and also use configure options to trigger
// the C-implementation of the transform).
//
// The particular WRAPLOW implementation below performs strict
// overflow wrapping to match common hardware implementations: the
// excess high bits of a 32-bit word are shifted out and the result is
// shifted back, which sign-extends the value from its low bits.
// bd of 8 keeps 16 bits, so 16 bits are removed
// bd of 10 keeps 18 bits, so 14 bits are removed
// bd of 12 keeps 20 bits, so 12 bits are removed
// bd of x keeps 8+x bits, so 24-x bits are removed
//
// The left shift is performed on uint32_t. Left-shifting a negative signed
// value (or shifting a bit into/past the sign bit) is undefined behavior in
// C, whereas an unsigned shift simply discards the high bits. The conversion
// back to int32_t and the right shift of a negative value are
// implementation-defined rather than undefined; this relies on the usual
// two's-complement conversion and arithmetic right shift.

#define WRAPLOW(x) (((int32_t)((uint32_t)check_range(x) << 16)) >> 16)
#if CONFIG_AOM_HIGHBITDEPTH
#define HIGHBD_WRAPLOW(x, bd)                                      \
  (((int32_t)((uint32_t)highbd_check_range((x), (bd))              \
              << (24 - (bd)))) >>                                  \
   (24 - (bd)))
#endif  // CONFIG_AOM_HIGHBITDEPTH

#else  // CONFIG_EMULATE_HARDWARE

// Without hardware emulation the value is only passed through the range
// check and converted to int32_t; no wrapping is applied.
#define WRAPLOW(x) ((int32_t)check_range(x))
#if CONFIG_AOM_HIGHBITDEPTH
#define HIGHBD_WRAPLOW(x, bd) ((int32_t)highbd_check_range((x), (bd)))
#endif  // CONFIG_AOM_HIGHBITDEPTH
#endif  // CONFIG_EMULATE_HARDWARE
99
Luca Barbatof0f98572016-09-03 12:14:15 +0200100void aom_idct4_c(const tran_low_t *input, tran_low_t *output);
101void aom_idct8_c(const tran_low_t *input, tran_low_t *output);
102void aom_idct16_c(const tran_low_t *input, tran_low_t *output);
103void aom_idct32_c(const tran_low_t *input, tran_low_t *output);
104void aom_iadst4_c(const tran_low_t *input, tran_low_t *output);
105void aom_iadst8_c(const tran_low_t *input, tran_low_t *output);
106void aom_iadst16_c(const tran_low_t *input, tran_low_t *output);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700107
Yaowu Xuf883b422016-08-30 14:01:10 -0700108#if CONFIG_AOM_HIGHBITDEPTH
109void aom_highbd_idct4_c(const tran_low_t *input, tran_low_t *output, int bd);
110void aom_highbd_idct8_c(const tran_low_t *input, tran_low_t *output, int bd);
111void aom_highbd_idct16_c(const tran_low_t *input, tran_low_t *output, int bd);
112void aom_highbd_idct32_c(const tran_low_t *input, tran_low_t *output, int bd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700113
Yaowu Xuf883b422016-08-30 14:01:10 -0700114void aom_highbd_iadst4_c(const tran_low_t *input, tran_low_t *output, int bd);
115void aom_highbd_iadst8_c(const tran_low_t *input, tran_low_t *output, int bd);
116void aom_highbd_iadst16_c(const tran_low_t *input, tran_low_t *output, int bd);
Yaowu Xuc27fc142016-08-22 16:08:15 -0700117
118static INLINE uint16_t highbd_clip_pixel_add(uint16_t dest, tran_high_t trans,
119 int bd) {
120 trans = HIGHBD_WRAPLOW(trans, bd);
121 return clip_pixel_highbd(dest + (int)trans, bd);
122}
123#endif
124
125static INLINE uint8_t clip_pixel_add(uint8_t dest, tran_high_t trans) {
126 trans = WRAPLOW(trans);
127 return clip_pixel(dest + (int)trans);
128}
129#ifdef __cplusplus
130} // extern "C"
131#endif
132
Yaowu Xuf883b422016-08-30 14:01:10 -0700133#endif // AOM_DSP_INV_TXFM_H_