495 строки
16 KiB
C
495 строки
16 KiB
C
/*
|
|
* Copyright (c) 2001-2016, Alliance for Open Media. All rights reserved
|
|
*
|
|
* This source code is subject to the terms of the BSD 2 Clause License and
|
|
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
|
|
* was not distributed with this source code in the LICENSE file, you can
|
|
* obtain it at www.aomedia.org/license/software. If the Alliance for Open
|
|
* Media Patent License 1.0 was not distributed with this source code in the
|
|
* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
|
|
*/
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
#include "./config.h"
|
|
#endif
|
|
|
|
#include "aom_dsp/entdec.h"
|
|
|
|
/*A range decoder.
|
|
This is an entropy decoder based upon \cite{Mar79}, which is itself a
|
|
rediscovery of the FIFO arithmetic code introduced by \cite{Pas76}.
|
|
It is very similar to arithmetic encoding, except that encoding is done with
|
|
digits in any base, instead of with bits, and so it is faster when using
|
|
larger bases (i.e.: a byte).
|
|
The author claims an average waste of $\frac{1}{2}\log_b(2b)$ bits, where $b$
|
|
is the base, longer than the theoretical optimum, but to my knowledge there
|
|
is no published justification for this claim.
|
|
This only seems true when using near-infinite precision arithmetic so that
|
|
the process is carried out with no rounding errors.
|
|
|
|
An excellent description of implementation details is available at
|
|
http://www.arturocampos.com/ac_range.html
|
|
A recent work \cite{MNW98} which proposes several changes to arithmetic
|
|
encoding for efficiency actually re-discovers many of the principles
|
|
behind range encoding, and presents a good theoretical analysis of them.
|
|
|
|
End of stream is handled by writing out the smallest number of bits that
|
|
ensures that the stream will be correctly decoded regardless of the value of
|
|
any subsequent bits.
|
|
od_ec_dec_tell() can be used to determine how many bits were needed to decode
|
|
all the symbols thus far; other data can be packed in the remaining bits of
|
|
the input buffer.
|
|
@PHDTHESIS{Pas76,
|
|
author="Richard Clark Pasco",
|
|
title="Source coding algorithms for fast data compression",
|
|
school="Dept. of Electrical Engineering, Stanford University",
|
|
address="Stanford, CA",
|
|
month=May,
|
|
year=1976,
|
|
URL="http://www.richpasco.org/scaffdc.pdf"
|
|
}
|
|
@INPROCEEDINGS{Mar79,
|
|
author="Martin, G.N.N.",
|
|
title="Range encoding: an algorithm for removing redundancy from a digitised
|
|
message",
|
|
booktitle="Video & Data Recording Conference",
|
|
year=1979,
|
|
address="Southampton",
|
|
month=Jul,
|
|
URL="http://www.compressconsult.com/rangecoder/rngcod.pdf.gz"
|
|
}
|
|
@ARTICLE{MNW98,
|
|
author="Alistair Moffat and Radford Neal and Ian H. Witten",
|
|
title="Arithmetic Coding Revisited",
|
|
journal="{ACM} Transactions on Information Systems",
|
|
year=1998,
|
|
volume=16,
|
|
number=3,
|
|
pages="256--294",
|
|
month=Jul,
|
|
URL="http://researchcommons.waikato.ac.nz/bitstream/handle/10289/78/content.pdf"
|
|
}*/
|
|
|
|
/*This is meant to be a large, positive constant that can still be efficiently
|
|
loaded as an immediate (on platforms like ARM, for example).
|
|
Even relatively modest values like 100 would work fine.*/
|
|
#define OD_EC_LOTS_OF_BITS (0x4000)
|
|
|
|
static void od_ec_dec_refill(od_ec_dec *dec) {
|
|
int s;
|
|
od_ec_window dif;
|
|
int16_t cnt;
|
|
const unsigned char *bptr;
|
|
const unsigned char *end;
|
|
dif = dec->dif;
|
|
cnt = dec->cnt;
|
|
bptr = dec->bptr;
|
|
end = dec->end;
|
|
s = OD_EC_WINDOW_SIZE - 9 - (cnt + 15);
|
|
for (; s >= 0 && bptr < end; s -= 8, bptr++) {
|
|
OD_ASSERT(s <= OD_EC_WINDOW_SIZE - 8);
|
|
dif |= (od_ec_window)bptr[0] << s;
|
|
cnt += 8;
|
|
}
|
|
if (bptr >= end) {
|
|
dec->tell_offs += OD_EC_LOTS_OF_BITS - cnt;
|
|
cnt = OD_EC_LOTS_OF_BITS;
|
|
}
|
|
dec->dif = dif;
|
|
dec->cnt = cnt;
|
|
dec->bptr = bptr;
|
|
}
|
|
|
|
/*Takes updated dif and range values, renormalizes them so that
|
|
32768 <= rng < 65536 (reading more bytes from the stream into dif if
|
|
necessary), and stores them back in the decoder context.
|
|
dif: The new value of dif.
|
|
rng: The new value of the range.
|
|
ret: The value to return.
|
|
Return: ret.
|
|
This allows the compiler to jump to this function via a tail-call.*/
|
|
static int od_ec_dec_normalize(od_ec_dec *dec, od_ec_window dif, unsigned rng,
|
|
int ret) {
|
|
int d;
|
|
OD_ASSERT(rng <= 65535U);
|
|
d = 16 - OD_ILOG_NZ(rng);
|
|
dec->cnt -= d;
|
|
dec->dif = dif << d;
|
|
dec->rng = rng << d;
|
|
if (dec->cnt < 0) od_ec_dec_refill(dec);
|
|
return ret;
|
|
}
|
|
|
|
/*Initializes the decoder.
|
|
buf: The input buffer to use.
|
|
Return: 0 on success, or a negative value on error.*/
|
|
void od_ec_dec_init(od_ec_dec *dec, const unsigned char *buf,
|
|
uint32_t storage) {
|
|
dec->buf = buf;
|
|
dec->eptr = buf + storage;
|
|
dec->end_window = 0;
|
|
dec->nend_bits = 0;
|
|
dec->tell_offs = 10 - (OD_EC_WINDOW_SIZE - 8);
|
|
dec->end = buf + storage;
|
|
dec->bptr = buf;
|
|
dec->dif = 0;
|
|
dec->rng = 0x8000;
|
|
dec->cnt = -15;
|
|
dec->error = 0;
|
|
od_ec_dec_refill(dec);
|
|
}
|
|
|
|
/*Decode a bit that has an fz/ft probability of being a zero.
|
|
fz: The probability that the bit is zero, scaled by _ft.
|
|
ft: The total probability.
|
|
This must be at least 16384 and no more than 32768.
|
|
Return: The value decoded (0 or 1).*/
|
|
int od_ec_decode_bool(od_ec_dec *dec, unsigned fz, unsigned ft) {
|
|
od_ec_window dif;
|
|
od_ec_window vw;
|
|
unsigned r;
|
|
int s;
|
|
unsigned v;
|
|
int ret;
|
|
OD_ASSERT(0 < fz);
|
|
OD_ASSERT(fz < ft);
|
|
OD_ASSERT(16384 <= ft);
|
|
OD_ASSERT(ft <= 32768U);
|
|
dif = dec->dif;
|
|
r = dec->rng;
|
|
OD_ASSERT(dif >> (OD_EC_WINDOW_SIZE - 16) < r);
|
|
OD_ASSERT(ft <= r);
|
|
s = r - ft >= ft;
|
|
ft <<= s;
|
|
fz <<= s;
|
|
OD_ASSERT(r - ft < ft);
|
|
#if OD_EC_REDUCED_OVERHEAD
|
|
{
|
|
unsigned d;
|
|
unsigned e;
|
|
d = r - ft;
|
|
e = OD_SUBSATU(2 * d, ft);
|
|
v = fz + OD_MINI(fz, e) + OD_MINI(OD_SUBSATU(fz, e) >> 1, d);
|
|
}
|
|
#else
|
|
v = fz + OD_MINI(fz, r - ft);
|
|
#endif
|
|
vw = (od_ec_window)v << (OD_EC_WINDOW_SIZE - 16);
|
|
ret = dif >= vw;
|
|
if (ret) dif -= vw;
|
|
r = ret ? r - v : v;
|
|
return od_ec_dec_normalize(dec, dif, r, ret);
|
|
}
|
|
|
|
/*Decode a bit that has an fz probability of being a zero in Q15.
|
|
This is a simpler, lower overhead version of od_ec_decode_bool() for use when
|
|
ft == 32768.
|
|
To be decoded properly by this function, symbols cannot have been encoded by
|
|
od_ec_encode(), but must have been encoded with one of the equivalent _q15()
|
|
or _dyadic() functions instead.
|
|
fz: The probability that the bit is zero, scaled by 32768.
|
|
Return: The value decoded (0 or 1).*/
|
|
int od_ec_decode_bool_q15(od_ec_dec *dec, unsigned fz) {
|
|
od_ec_window dif;
|
|
od_ec_window vw;
|
|
unsigned r;
|
|
unsigned r_new;
|
|
unsigned v;
|
|
int ret;
|
|
OD_ASSERT(0 < fz);
|
|
OD_ASSERT(fz < 32768U);
|
|
dif = dec->dif;
|
|
r = dec->rng;
|
|
OD_ASSERT(dif >> (OD_EC_WINDOW_SIZE - 16) < r);
|
|
OD_ASSERT(32768U <= r);
|
|
v = fz * (uint32_t)r >> 15;
|
|
vw = (od_ec_window)v << (OD_EC_WINDOW_SIZE - 16);
|
|
ret = 0;
|
|
r_new = v;
|
|
if (dif >= vw) {
|
|
r_new = r - v;
|
|
dif -= vw;
|
|
ret = 1;
|
|
}
|
|
return od_ec_dec_normalize(dec, dif, r_new, ret);
|
|
}
|
|
|
|
/*Decodes a symbol given a cumulative distribution function (CDF) table.
|
|
cdf: The CDF, such that symbol s falls in the range
|
|
[s > 0 ? cdf[s - 1] : 0, cdf[s]).
|
|
The values must be monotonically non-increasing, and cdf[nsyms - 1]
|
|
must be at least 16384, and no more than 32768.
|
|
nsyms: The number of symbols in the alphabet.
|
|
This should be at most 16.
|
|
Return: The decoded symbol s.*/
|
|
int od_ec_decode_cdf(od_ec_dec *dec, const uint16_t *cdf, int nsyms) {
|
|
od_ec_window dif;
|
|
unsigned r;
|
|
unsigned c;
|
|
unsigned d;
|
|
#if OD_EC_REDUCED_OVERHEAD
|
|
unsigned e;
|
|
#endif
|
|
int s;
|
|
unsigned u;
|
|
unsigned v;
|
|
unsigned q;
|
|
unsigned fl;
|
|
unsigned fh;
|
|
unsigned ft;
|
|
int ret;
|
|
dif = dec->dif;
|
|
r = dec->rng;
|
|
OD_ASSERT(dif >> (OD_EC_WINDOW_SIZE - 16) < r);
|
|
OD_ASSERT(nsyms > 0);
|
|
ft = cdf[nsyms - 1];
|
|
OD_ASSERT(16384 <= ft);
|
|
OD_ASSERT(ft <= 32768U);
|
|
OD_ASSERT(ft <= r);
|
|
s = r - ft >= ft;
|
|
ft <<= s;
|
|
d = r - ft;
|
|
OD_ASSERT(d < ft);
|
|
c = (unsigned)(dif >> (OD_EC_WINDOW_SIZE - 16));
|
|
q = OD_MAXI((int)(c >> 1), (int)(c - d));
|
|
#if OD_EC_REDUCED_OVERHEAD
|
|
e = OD_SUBSATU(2 * d, ft);
|
|
/*The correctness of this inverse partition function is not obvious, but it
|
|
was checked exhaustively for all possible values of r, ft, and c.
|
|
TODO: It should be possible to optimize this better than the compiler,
|
|
given that we do not care about the accuracy of negative results (as we
|
|
will not use them).
|
|
It would also be nice to get rid of the 32-bit dividend, as it requires a
|
|
32x32->64 bit multiply to invert.*/
|
|
q = OD_MAXI((int)q, (int)((2 * (int32_t)c + 1 - (int32_t)e) / 3));
|
|
#endif
|
|
q >>= s;
|
|
OD_ASSERT(q<ft>> s);
|
|
fl = 0;
|
|
ret = 0;
|
|
for (fh = cdf[ret]; fh <= q; fh = cdf[++ret]) fl = fh;
|
|
OD_ASSERT(fh <= ft >> s);
|
|
fl <<= s;
|
|
fh <<= s;
|
|
#if OD_EC_REDUCED_OVERHEAD
|
|
u = fl + OD_MINI(fl, e) + OD_MINI(OD_SUBSATU(fl, e) >> 1, d);
|
|
v = fh + OD_MINI(fh, e) + OD_MINI(OD_SUBSATU(fh, e) >> 1, d);
|
|
#else
|
|
u = fl + OD_MINI(fl, d);
|
|
v = fh + OD_MINI(fh, d);
|
|
#endif
|
|
r = v - u;
|
|
dif -= (od_ec_window)u << (OD_EC_WINDOW_SIZE - 16);
|
|
return od_ec_dec_normalize(dec, dif, r, ret);
|
|
}
|
|
|
|
/*Decodes a symbol given a cumulative distribution function (CDF) table.
|
|
cdf: The CDF, such that symbol s falls in the range
|
|
[s > 0 ? cdf[s - 1] : 0, cdf[s]).
|
|
The values must be monotonically non-increasing, and cdf[nsyms - 1]
|
|
must be at least 2, and no more than 32768.
|
|
nsyms: The number of symbols in the alphabet.
|
|
This should be at most 16.
|
|
Return: The decoded symbol s.*/
|
|
int od_ec_decode_cdf_unscaled(od_ec_dec *dec, const uint16_t *cdf, int nsyms) {
|
|
od_ec_window dif;
|
|
unsigned r;
|
|
unsigned c;
|
|
unsigned d;
|
|
#if OD_EC_REDUCED_OVERHEAD
|
|
unsigned e;
|
|
#endif
|
|
int s;
|
|
unsigned u;
|
|
unsigned v;
|
|
unsigned q;
|
|
unsigned fl;
|
|
unsigned fh;
|
|
unsigned ft;
|
|
int ret;
|
|
dif = dec->dif;
|
|
r = dec->rng;
|
|
OD_ASSERT(dif >> (OD_EC_WINDOW_SIZE - 16) < r);
|
|
OD_ASSERT(nsyms > 0);
|
|
ft = cdf[nsyms - 1];
|
|
OD_ASSERT(2 <= ft);
|
|
OD_ASSERT(ft <= 32768U);
|
|
s = 15 - OD_ILOG_NZ(ft - 1);
|
|
ft <<= s;
|
|
OD_ASSERT(ft <= r);
|
|
if (r - ft >= ft) {
|
|
ft <<= 1;
|
|
s++;
|
|
}
|
|
d = r - ft;
|
|
OD_ASSERT(d < ft);
|
|
c = (unsigned)(dif >> (OD_EC_WINDOW_SIZE - 16));
|
|
q = OD_MAXI((int)(c >> 1), (int)(c - d));
|
|
#if OD_EC_REDUCED_OVERHEAD
|
|
e = OD_SUBSATU(2 * d, ft);
|
|
/*TODO: See TODO above.*/
|
|
q = OD_MAXI((int)q, (int)((2 * (int32_t)c + 1 - (int32_t)e) / 3));
|
|
#endif
|
|
q >>= s;
|
|
OD_ASSERT(q<ft>> s);
|
|
fl = 0;
|
|
ret = 0;
|
|
for (fh = cdf[ret]; fh <= q; fh = cdf[++ret]) fl = fh;
|
|
OD_ASSERT(fh <= ft >> s);
|
|
fl <<= s;
|
|
fh <<= s;
|
|
#if OD_EC_REDUCED_OVERHEAD
|
|
u = fl + OD_MINI(fl, e) + OD_MINI(OD_SUBSATU(fl, e) >> 1, d);
|
|
v = fh + OD_MINI(fh, e) + OD_MINI(OD_SUBSATU(fh, e) >> 1, d);
|
|
#else
|
|
u = fl + OD_MINI(fl, d);
|
|
v = fh + OD_MINI(fh, d);
|
|
#endif
|
|
r = v - u;
|
|
dif -= (od_ec_window)u << (OD_EC_WINDOW_SIZE - 16);
|
|
return od_ec_dec_normalize(dec, dif, r, ret);
|
|
}
|
|
|
|
/*Decodes a symbol given a cumulative distribution function (CDF) table that
|
|
sums to a power of two.
|
|
This is a simpler, lower overhead version of od_ec_decode_cdf() for use when
|
|
cdf[nsyms - 1] is a power of two.
|
|
To be decoded properly by this function, symbols cannot have been encoded by
|
|
od_ec_encode(), but must have been encoded with one of the equivalent _q15()
|
|
functions instead.
|
|
cdf: The CDF, such that symbol s falls in the range
|
|
[s > 0 ? cdf[s - 1] : 0, cdf[s]).
|
|
The values must be monotonically non-increasing, and cdf[nsyms - 1]
|
|
must be exactly 1 << ftb.
|
|
nsyms: The number of symbols in the alphabet.
|
|
This should be at most 16.
|
|
ftb: The number of bits of precision in the cumulative distribution.
|
|
This must be no more than 15.
|
|
Return: The decoded symbol s.*/
|
|
int od_ec_decode_cdf_unscaled_dyadic(od_ec_dec *dec, const uint16_t *cdf,
|
|
int nsyms, unsigned ftb) {
|
|
od_ec_window dif;
|
|
unsigned r;
|
|
unsigned c;
|
|
unsigned u;
|
|
unsigned v;
|
|
int ret;
|
|
(void)nsyms;
|
|
dif = dec->dif;
|
|
r = dec->rng;
|
|
OD_ASSERT(dif >> (OD_EC_WINDOW_SIZE - 16) < r);
|
|
OD_ASSERT(ftb <= 15);
|
|
OD_ASSERT(cdf[nsyms - 1] == 1U << ftb);
|
|
OD_ASSERT(32768U <= r);
|
|
c = (unsigned)(dif >> (OD_EC_WINDOW_SIZE - 16));
|
|
v = 0;
|
|
ret = -1;
|
|
do {
|
|
u = v;
|
|
v = cdf[++ret] * (uint32_t)r >> ftb;
|
|
} while (v <= c);
|
|
OD_ASSERT(v <= r);
|
|
r = v - u;
|
|
dif -= (od_ec_window)u << (OD_EC_WINDOW_SIZE - 16);
|
|
return od_ec_dec_normalize(dec, dif, r, ret);
|
|
}
|
|
|
|
/*Decodes a symbol given a cumulative distribution function (CDF) table in Q15.
|
|
This is a simpler, lower overhead version of od_ec_decode_cdf() for use when
|
|
cdf[nsyms - 1] == 32768.
|
|
To be decoded properly by this function, symbols cannot have been encoded by
|
|
od_ec_encode(), but must have been encoded with one of the equivalent _q15()
|
|
or dyadic() functions instead.
|
|
cdf: The CDF, such that symbol s falls in the range
|
|
[s > 0 ? cdf[s - 1] : 0, cdf[s]).
|
|
The values must be monotonically non-increasing, and cdf[nsyms - 1]
|
|
must be 32768.
|
|
nsyms: The number of symbols in the alphabet.
|
|
This should be at most 16.
|
|
Return: The decoded symbol s.*/
|
|
int od_ec_decode_cdf_q15(od_ec_dec *dec, const uint16_t *cdf, int nsyms) {
|
|
return od_ec_decode_cdf_unscaled_dyadic(dec, cdf, nsyms, 15);
|
|
}
|
|
|
|
/*Extracts a raw unsigned integer with a non-power-of-2 range from the stream.
|
|
The integer must have been encoded with od_ec_enc_uint().
|
|
ft: The number of integers that can be decoded (one more than the max).
|
|
This must be at least 2, and no more than 2**29.
|
|
Return: The decoded bits.*/
|
|
uint32_t od_ec_dec_uint(od_ec_dec *dec, uint32_t ft) {
|
|
OD_ASSERT(ft >= 2);
|
|
OD_ASSERT(ft <= (uint32_t)1 << (25 + OD_EC_UINT_BITS));
|
|
if (ft > 1U << OD_EC_UINT_BITS) {
|
|
uint32_t t;
|
|
int ft1;
|
|
int ftb;
|
|
ft--;
|
|
ftb = OD_ILOG_NZ(ft) - OD_EC_UINT_BITS;
|
|
ft1 = (int)(ft >> ftb) + 1;
|
|
t = od_ec_decode_cdf_q15(dec, OD_UNIFORM_CDF_Q15(ft1), ft1);
|
|
t = t << ftb | od_ec_dec_bits(dec, ftb, "");
|
|
if (t <= ft) return t;
|
|
dec->error = 1;
|
|
return ft;
|
|
}
|
|
return od_ec_decode_cdf_q15(dec, OD_UNIFORM_CDF_Q15(ft), (int)ft);
|
|
}
|
|
|
|
/*Extracts a sequence of raw bits from the stream.
|
|
The bits must have been encoded with od_ec_enc_bits().
|
|
ftb: The number of bits to extract.
|
|
This must be between 0 and 25, inclusive.
|
|
Return: The decoded bits.*/
|
|
uint32_t od_ec_dec_bits_(od_ec_dec *dec, unsigned ftb) {
|
|
od_ec_window window;
|
|
int available;
|
|
uint32_t ret;
|
|
OD_ASSERT(ftb <= 25);
|
|
window = dec->end_window;
|
|
available = dec->nend_bits;
|
|
if ((unsigned)available < ftb) {
|
|
const unsigned char *buf;
|
|
const unsigned char *eptr;
|
|
buf = dec->buf;
|
|
eptr = dec->eptr;
|
|
OD_ASSERT(available <= OD_EC_WINDOW_SIZE - 8);
|
|
do {
|
|
if (eptr <= buf) {
|
|
dec->tell_offs += OD_EC_LOTS_OF_BITS - available;
|
|
available = OD_EC_LOTS_OF_BITS;
|
|
break;
|
|
}
|
|
window |= (od_ec_window) * --eptr << available;
|
|
available += 8;
|
|
} while (available <= OD_EC_WINDOW_SIZE - 8);
|
|
dec->eptr = eptr;
|
|
}
|
|
ret = (uint32_t)window & (((uint32_t)1 << ftb) - 1);
|
|
window >>= ftb;
|
|
available -= ftb;
|
|
dec->end_window = window;
|
|
dec->nend_bits = available;
|
|
return ret;
|
|
}
|
|
|
|
/*Returns the number of bits "used" by the decoded symbols so far.
|
|
This same number can be computed in either the encoder or the decoder, and is
|
|
suitable for making coding decisions.
|
|
Return: The number of bits.
|
|
This will always be slightly larger than the exact value (e.g., all
|
|
rounding error is in the positive direction).*/
|
|
int od_ec_dec_tell(const od_ec_dec *dec) {
|
|
return (int)(((dec->end - dec->eptr) + (dec->bptr - dec->buf)) * 8 -
|
|
dec->cnt - dec->nend_bits + dec->tell_offs);
|
|
}
|
|
|
|
/*Returns the number of bits "used" by the decoded symbols so far.
|
|
This same number can be computed in either the encoder or the decoder, and is
|
|
suitable for making coding decisions.
|
|
Return: The number of bits scaled by 2**OD_BITRES.
|
|
This will always be slightly larger than the exact value (e.g., all
|
|
rounding error is in the positive direction).*/
|
|
uint32_t od_ec_dec_tell_frac(const od_ec_dec *dec) {
|
|
return od_ec_tell_frac(od_ec_dec_tell(dec), dec->rng);
|
|
}
|