| /* |
| * Copyright (c) 2021, Alliance for Open Media. All rights reserved |
| * |
| * This source code is subject to the terms of the BSD 3-Clause Clear License |
| * and the Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear |
| * License was not distributed with this source code in the LICENSE file, you |
| * can obtain it at aomedia.org/license/software-license/bsd-3-c-c/. If the |
| * Alliance for Open Media Patent License 1.0 was not distributed with this |
| * source code in the PATENTS file, you can obtain it at |
| * aomedia.org/license/patent-license/. |
| */ |
| |
| #include <assert.h> |
| #include "aom_dsp/entdec.h" |
| #include "aom_dsp/prob.h" |
| |
| /*A range decoder. |
| This is an entropy decoder based upon \cite{Mar79}, which is itself a |
| rediscovery of the FIFO arithmetic code introduced by \cite{Pas76}. |
| It is very similar to arithmetic encoding, except that encoding is done with |
| digits in any base, instead of with bits, and so it is faster when using |
| larger bases (i.e.: a byte). |
| The author claims an average waste of $\frac{1}{2}\log_b(2b)$ bits, where $b$ |
| is the base, longer than the theoretical optimum, but to my knowledge there |
| is no published justification for this claim. |
| This only seems true when using near-infinite precision arithmetic so that |
| the process is carried out with no rounding errors. |
| |
| An excellent description of implementation details is available at |
| http://www.arturocampos.com/ac_range.html |
| A recent work \cite{MNW98} which proposes several changes to arithmetic |
| encoding for efficiency actually re-discovers many of the principles |
| behind range encoding, and presents a good theoretical analysis of them. |
| |
| End of stream is handled by writing out the smallest number of bits that |
| ensures that the stream will be correctly decoded regardless of the value of |
| any subsequent bits. |
| od_ec_dec_tell() can be used to determine how many bits were needed to decode |
| all the symbols thus far; other data can be packed in the remaining bits of |
| the input buffer. |
| @PHDTHESIS{Pas76, |
| author="Richard Clark Pasco", |
| title="Source coding algorithms for fast data compression", |
| school="Dept. of Electrical Engineering, Stanford University", |
| address="Stanford, CA", |
| month=May, |
| year=1976, |
| URL="http://www.richpasco.org/scaffdc.pdf" |
| } |
| @INPROCEEDINGS{Mar79, |
| author="Martin, G.N.N.", |
| title="Range encoding: an algorithm for removing redundancy from a digitised |
| message", |
| booktitle="Video & Data Recording Conference", |
| year=1979, |
| address="Southampton", |
| month=Jul, |
| URL="http://www.compressconsult.com/rangecoder/rngcod.pdf.gz" |
| } |
| @ARTICLE{MNW98, |
| author="Alistair Moffat and Radford Neal and Ian H. Witten", |
| title="Arithmetic Coding Revisited", |
| journal="{ACM} Transactions on Information Systems", |
| year=1998, |
| volume=16, |
| number=3, |
| pages="256--294", |
| month=Jul, |
| URL="http://researchcommons.waikato.ac.nz/bitstream/handle/10289/78/content.pdf" |
| }*/ |
| |
| /*This is meant to be a large, positive constant that can still be efficiently |
| loaded as an immediate (on platforms like ARM, for example). |
| Even relatively modest values like 100 would work fine.*/ |
| #define OD_EC_LOTS_OF_BITS (0x4000) |
| |
| /* Minimum # of preloaded bits to maintain in od_ec_window. */ |
| #if CONFIG_BYPASS_IMPROVEMENT |
| #define OD_EC_MIN_BITS 8 |
| #else |
| #define OD_EC_MIN_BITS 0 |
| #endif // CONFIG_BYPASS_IMPROVEMENT |
| |
| /*The return value of od_ec_dec_tell does not change across an od_ec_dec_refill |
| call.*/ |
| static void od_ec_dec_refill(od_ec_dec *dec) { |
| int s; |
| od_ec_window dif; |
| int16_t cnt; |
| const unsigned char *bptr; |
| const unsigned char *end; |
| dif = dec->dif; |
| cnt = dec->cnt; |
| bptr = dec->bptr; |
| end = dec->end; |
| s = OD_EC_WINDOW_SIZE - 9 - (cnt + 15); |
| for (; s >= 0 && bptr < end; s -= 8, bptr++) { |
| /*Each time a byte is inserted into the window (dif), bptr advances and cnt |
| is incremented by 8, so the total number of consumed bits (the return |
| value of od_ec_dec_tell) does not change.*/ |
| assert(s <= OD_EC_WINDOW_SIZE - 8); |
| dif ^= (od_ec_window)bptr[0] << s; |
| cnt += 8; |
| } |
| if (bptr >= end) { |
| /*We've reached the end of the buffer. It is perfectly valid for us to need |
| to fill the window with additional bits past the end of the buffer (and |
| this happens in normal operation). These bits should all just be taken |
| as zero. But we cannot increment bptr past 'end' (this is undefined |
| behavior), so we start to increment dec->tell_offs. We also don't want |
| to keep testing bptr against 'end', so we set cnt to OD_EC_LOTS_OF_BITS |
| and adjust dec->tell_offs so that the total number of unconsumed bits in |
| the window (dec->cnt - dec->tell_offs) does not change. This effectively |
| puts lots of zero bits into the window, and means we won't try to refill |
| it from the buffer for a very long time (at which point we'll put lots |
| of zero bits into the window again).*/ |
| dec->tell_offs += OD_EC_LOTS_OF_BITS - cnt; |
| cnt = OD_EC_LOTS_OF_BITS; |
| } |
| dec->dif = dif; |
| dec->cnt = cnt; |
| dec->bptr = bptr; |
| } |
| |
| /*Takes updated dif and range values, renormalizes them so that |
| 32768 <= rng < 65536 (reading more bytes from the stream into dif if |
| necessary), and stores them back in the decoder context. |
| dif: The new value of dif. |
| rng: The new value of the range. |
| ret: The value to return. |
| Return: ret. |
| This allows the compiler to jump to this function via a tail-call.*/ |
| static int od_ec_dec_normalize(od_ec_dec *dec, od_ec_window dif, unsigned rng, |
| int ret) { |
| int d; |
| assert(rng <= 65535U); |
| /*The number of leading zeros in the 16-bit binary representation of rng.*/ |
| d = 16 - OD_ILOG_NZ(rng); |
| /*d bits in dec->dif are consumed.*/ |
| dec->cnt -= d; |
| /*This is equivalent to shifting in 1's instead of 0's.*/ |
| dec->dif = ((dif + 1) << d) - 1; |
| dec->rng = rng << d; |
| if (dec->cnt < OD_EC_MIN_BITS) od_ec_dec_refill(dec); |
| return ret; |
| } |
| |
| #if CONFIG_BYPASS_IMPROVEMENT |
| /* This function performs renormalization after decoding bypass symbols. |
| This is a simplified version of od_ec_dec_normalize(), as bypass |
| symbol decoding only requires shifting in new bits, and the range |
| value remains unchanged. */ |
| static int od_ec_dec_bypass_normalize(od_ec_dec *dec, od_ec_window dif, |
| int n_bypass, int ret) { |
| /*n_bypass bits in dec->dif are consumed.*/ |
| dec->cnt -= n_bypass; |
| /*This is equivalent to shifting in 1's instead of 0's.*/ |
| dec->dif = ((dif + 1) << n_bypass) - 1; |
| if (dec->cnt < OD_EC_MIN_BITS) od_ec_dec_refill(dec); |
| return ret; |
| } |
| |
| // Scale the CDF to match the range value stored in the entropy decoder. |
| static INLINE unsigned od_ec_prob_scale(uint16_t p, unsigned r, int n) { |
| return (((r >> 8) * (uint32_t)(p >> EC_PROB_SHIFT) >> |
| (7 - EC_PROB_SHIFT - CDF_SHIFT + 1)) |
| << 1) + |
| EC_MIN_PROB * n; |
| } |
| #endif // CONFIG_BYPASS_IMPROVEMENT |
| |
| /*Initializes the decoder. |
| buf: The input buffer to use. |
| storage: The size in bytes of the input buffer.*/ |
| void od_ec_dec_init(od_ec_dec *dec, const unsigned char *buf, |
| uint32_t storage) { |
| dec->buf = buf; |
| dec->end = buf + storage; |
| dec->bptr = buf; |
| dec->dif = ((od_ec_window)1 << (OD_EC_WINDOW_SIZE - 1)) - 1; |
| dec->rng = 0x8000; |
| dec->cnt = -15; |
| dec->tell_offs = dec->cnt + 1; |
| od_ec_dec_refill(dec); |
| } |
| |
| /*Decode a single binary value. |
| f: The probability that the bit is one, scaled by 32768. |
| Return: The value decoded (0 or 1).*/ |
| int od_ec_decode_bool_q15(od_ec_dec *dec, unsigned f) { |
| od_ec_window dif; |
| od_ec_window vw; |
| unsigned r; |
| unsigned r_new; |
| unsigned v; |
| int ret; |
| assert(0 < f); |
| assert(f < 32768U); |
| dif = dec->dif; |
| r = dec->rng; |
| assert(dif >> (OD_EC_WINDOW_SIZE - 16) < r); |
| assert(32768U <= r); |
| #if CONFIG_BYPASS_IMPROVEMENT |
| v = od_ec_prob_scale(f, r, 1); |
| #else |
| v = ((r >> 8) * (uint32_t)(f >> EC_PROB_SHIFT) >> (7 - EC_PROB_SHIFT)); |
| v += EC_MIN_PROB; |
| #endif |
| vw = (od_ec_window)v << (OD_EC_WINDOW_SIZE - 16); |
| ret = 1; |
| r_new = v; |
| if (dif >= vw) { |
| r_new = r - v; |
| dif -= vw; |
| ret = 0; |
| } |
| return od_ec_dec_normalize(dec, dif, r_new, ret); |
| } |
| |
| #if CONFIG_BYPASS_IMPROVEMENT |
| /*Decode a single binary value, with 50/50 probability. |
| Return: The value decoded (0 or 1).*/ |
| int od_ec_decode_bool_bypass(od_ec_dec *dec) { |
| return od_ec_decode_literal_bypass(dec, 1); |
| } |
| |
| /*Decode a literal of n_bits |
| n_bits: Number of bits to decode 1..8 |
| Return: The value decoded (0..2^n_bits-1).*/ |
| int od_ec_decode_literal_bypass(od_ec_dec *dec, int n_bits) { |
| od_ec_window dif; |
| od_ec_window vw; |
| unsigned r; |
| int ret; |
| dif = dec->dif; |
| r = dec->rng; |
| assert((r & 1) == 0); |
| assert(dif >> (OD_EC_WINDOW_SIZE - 16) < r); |
| assert(32768U <= r); |
| assert(0 < n_bits && n_bits <= 32); |
| vw = (od_ec_window)r << (OD_EC_WINDOW_SIZE - 16); |
| ret = 0; |
| for (int bit = 0; bit < n_bits; bit++) { |
| vw >>= 1; |
| ret <<= 1; |
| if (dif >= vw) { |
| dif -= vw; |
| } else { |
| ret |= 1; |
| } |
| } |
| return od_ec_dec_bypass_normalize(dec, dif, n_bits, ret); |
| } |
| |
| /*Decode unary-coded symbol. |
| max_bits: Max number of decoded bits. |
| Return: The value decoded (0..2^n_bits-1).*/ |
| OD_WARN_UNUSED_RESULT int od_ec_decode_unary_bypass(od_ec_dec *dec, |
| int max_bits) |
| OD_ARG_NONNULL(1); |
| int od_ec_decode_unary_bypass(od_ec_dec *dec, int max_bits) { |
| if (dec->cnt < max_bits - 1) od_ec_dec_refill(dec); |
| od_ec_window dif; |
| od_ec_window vw; |
| unsigned r; |
| int ret; |
| dif = dec->dif; |
| r = dec->rng; |
| assert((r & 1) == 0); |
| assert(dif >> (OD_EC_WINDOW_SIZE - 16) < r); |
| assert(32768U <= r); |
| assert((0 < max_bits) && (max_bits <= 32)); |
| vw = (od_ec_window)r << (OD_EC_WINDOW_SIZE - 16); |
| ret = 0; |
| int bit; |
| for (bit = 0; bit < max_bits; bit++) { |
| vw >>= 1; |
| if (dif >= vw) { |
| dif -= vw; |
| ret++; |
| } else { |
| bit++; |
| break; |
| } |
| } |
| return od_ec_dec_bypass_normalize(dec, dif, bit, ret); |
| } |
| #endif // CONFIG_BYPASS_IMPROVEMENT |
| |
| /*Decodes a symbol given an inverse cumulative distribution function (CDF) |
| table in Q15. |
| icdf: CDF_PROB_TOP minus the CDF, such that symbol s falls in the range |
| [s > 0 ? (CDF_PROB_TOP - icdf[s - 1]) : 0, CDF_PROB_TOP - icdf[s]). |
| The values must be monotonically non-increasing, and icdf[nsyms - 1] |
| must be 0. |
| nsyms: The number of symbols in the alphabet. |
| This should be at most 16. |
| Return: The decoded symbol s.*/ |
| int od_ec_decode_cdf_q15(od_ec_dec *dec, const uint16_t *icdf, int nsyms) { |
| od_ec_window dif; |
| unsigned r; |
| unsigned c; |
| unsigned u; |
| unsigned v; |
| int ret; |
| (void)nsyms; |
| dif = dec->dif; |
| r = dec->rng; |
| const int N = nsyms - 1; |
| |
| assert(dif >> (OD_EC_WINDOW_SIZE - 16) < r); |
| assert(icdf[nsyms - 1] == OD_ICDF(CDF_PROB_TOP)); |
| assert(32768U <= r); |
| assert(7 - EC_PROB_SHIFT - CDF_SHIFT >= 0); |
| c = (unsigned)(dif >> (OD_EC_WINDOW_SIZE - 16)); |
| v = r; |
| ret = -1; |
| do { |
| u = v; |
| #if CONFIG_BYPASS_IMPROVEMENT |
| ret++; |
| v = od_ec_prob_scale(icdf[ret], r, N - ret); |
| #else |
| v = ((r >> 8) * (uint32_t)(icdf[++ret] >> EC_PROB_SHIFT) >> |
| (7 - EC_PROB_SHIFT - CDF_SHIFT)); |
| v += EC_MIN_PROB * (N - ret); |
| #endif // CONFIG_BYPASS_IMPROVEMENT |
| } while (c < v); |
| assert(v < u); |
| assert(u <= r); |
| r = u - v; |
| dif -= (od_ec_window)v << (OD_EC_WINDOW_SIZE - 16); |
| return od_ec_dec_normalize(dec, dif, r, ret); |
| } |
| |
| /*Returns the number of bits "used" by the decoded symbols so far. |
| This same number can be computed in either the encoder or the decoder, and is |
| suitable for making coding decisions. |
| Return: The number of bits. |
| This will always be slightly larger than the exact value (e.g., all |
| rounding error is in the positive direction).*/ |
| int od_ec_dec_tell(const od_ec_dec *dec) { |
| /*There is a window of bits stored in dec->dif. The difference |
| (dec->bptr - dec->buf) tells us how many bytes have been read into this |
| window. The difference (dec->cnt - dec->tell_offs) tells us how many of |
| the bits in that window remain unconsumed.*/ |
| return (int)((dec->bptr - dec->buf) * 8 - dec->cnt + dec->tell_offs); |
| } |
| |
| /*Returns the number of bits "used" by the decoded symbols so far. |
| This same number can be computed in either the encoder or the decoder, and is |
| suitable for making coding decisions. |
| Return: The number of bits scaled by 2**OD_BITRES. |
| This will always be slightly larger than the exact value (e.g., all |
| rounding error is in the positive direction).*/ |
| uint64_t od_ec_dec_tell_frac(const od_ec_dec *dec) { |
| return od_ec_tell_frac(od_ec_dec_tell(dec), dec->rng); |
| } |