189 строки
6.2 KiB
C
189 строки
6.2 KiB
C
/*
|
|
* Copyright (c) 2001-2016, Alliance for Open Media. All rights reserved
|
|
*
|
|
* This source code is subject to the terms of the BSD 2 Clause License and
|
|
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
|
|
* was not distributed with this source code in the LICENSE file, you can
|
|
* obtain it at www.aomedia.org/license/software. If the Alliance for Open
|
|
* Media Patent License 1.0 was not distributed with this source code in the
|
|
* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
|
|
*/
|
|
|
|
/* clang-format off */
|
|
|
|
#if !defined(_pvq_H)
|
|
# define _pvq_H (1)
|
|
# include "generic_code.h"
|
|
# include "odintrin.h"
|
|
|
|
extern const uint16_t EXP_CDF_TABLE[][16];
|
|
extern const uint16_t LAPLACE_OFFSET[];
|
|
|
|
#if CONFIG_DAALA_DIST
|
|
#define AV1_PVQ_ENABLE_ACTIVITY_MASKING (1)
|
|
#else
|
|
#define AV1_PVQ_ENABLE_ACTIVITY_MASKING (0)
|
|
#endif
|
|
|
|
# define PVQ_MAX_PARTITIONS (1 + 3*(OD_TXSIZES-1))
|
|
|
|
# define OD_NOREF_ADAPT_SPEED (4)
|
|
/* Normalized lambda for PVQ quantizer. Since we normalize the gain by q, the
|
|
distortion is normalized by q^2 and lambda does not need the q^2 factor.
|
|
At high rate, this would be log(2)/6, but we're using a slightly more
|
|
aggressive value, closer to:
|
|
Li, Xiang, et al. "Laplace distribution based Lagrangian rate distortion
|
|
optimization for hybrid video coding." Circuits and Systems for Video
|
|
Technology, IEEE Transactions on 19.2 (2009): 193-205.
|
|
*/
|
|
# define OD_PVQ_LAMBDA (.1146)
|
|
|
|
#define OD_PVQ_SKIP_ZERO 1
|
|
#define OD_PVQ_SKIP_COPY 2
|
|
|
|
/* Maximum size for coding a PVQ band. */
|
|
#define OD_MAX_PVQ_SIZE (1024)
|
|
|
|
#if defined(OD_FLOAT_PVQ)
|
|
#define OD_QM_SHIFT (15)
|
|
#else
|
|
#define OD_QM_SHIFT (11)
|
|
#endif
|
|
#define OD_QM_SCALE (1 << OD_QM_SHIFT)
|
|
#if defined(OD_FLOAT_PVQ)
|
|
#define OD_QM_SCALE_1 (1./OD_QM_SCALE)
|
|
#endif
|
|
#define OD_QM_SCALE_MAX 32767
|
|
#define OD_QM_INV_SHIFT (12)
|
|
#define OD_QM_INV_SCALE (1 << OD_QM_INV_SHIFT)
|
|
#if defined(OD_FLOAT_PVQ)
|
|
#define OD_QM_INV_SCALE_1 (1./OD_QM_INV_SCALE)
|
|
#endif
|
|
#define OD_QM_OFFSET(bs) ((((1 << 2*bs) - 1) << 2*OD_LOG_BSIZE0)/3)
|
|
#define OD_QM_STRIDE (OD_QM_OFFSET(OD_TXSIZES))
|
|
#define OD_QM_BUFFER_SIZE (2*OD_QM_STRIDE)
|
|
|
|
#if !defined(OD_FLOAT_PVQ)
|
|
#define OD_THETA_SHIFT (15)
|
|
#define OD_THETA_SCALE ((1 << OD_THETA_SHIFT)*2./M_PI)
|
|
#define OD_MAX_THETA_SCALE (1 << OD_THETA_SHIFT)
|
|
#define OD_TRIG_SCALE (32768)
|
|
#define OD_BETA_SHIFT (12)
|
|
#define OD_BETA_SCALE_1 (1./(1 << OD_BETA_SHIFT))
|
|
/*Multiplies 16-bit a by 32-bit b and keeps bits [16:64-OD_BETA_SHIFT-1].*/
|
|
#define OD_MULT16_32_QBETA(a, b) \
|
|
((int16_t)(a)*(int64_t)(int32_t)(b) >> OD_BETA_SHIFT)
|
|
# define OD_MULT16_16_QBETA(a, b) \
|
|
((((int16_t)(a))*((int32_t)(int16_t)(b))) >> OD_BETA_SHIFT)
|
|
#define OD_CGAIN_SHIFT (8)
|
|
#define OD_CGAIN_SCALE (1 << OD_CGAIN_SHIFT)
|
|
#else
|
|
#define OD_BETA_SCALE_1 (1.)
|
|
#define OD_THETA_SCALE (1)
|
|
#define OD_TRIG_SCALE (1)
|
|
#define OD_CGAIN_SCALE (1)
|
|
#endif
|
|
#define OD_THETA_SCALE_1 (1./OD_THETA_SCALE)
|
|
#define OD_TRIG_SCALE_1 (1./OD_TRIG_SCALE)
|
|
#define OD_CGAIN_SCALE_1 (1./OD_CGAIN_SCALE)
|
|
#define OD_CGAIN_SCALE_2 (OD_CGAIN_SCALE_1*OD_CGAIN_SCALE_1)
|
|
|
|
/* Largest PVQ partition is half the coefficients of largest block size. */
|
|
#define MAXN (OD_TXSIZE_MAX*OD_TXSIZE_MAX/2)
|
|
|
|
#define OD_COMPAND_SHIFT (8 + OD_COEFF_SHIFT)
|
|
#define OD_COMPAND_SCALE (1 << OD_COMPAND_SHIFT)
|
|
#define OD_COMPAND_SCALE_1 (1./OD_COMPAND_SCALE)
|
|
|
|
#define OD_QM_SIZE (OD_TXSIZES*(OD_TXSIZES + 1))
|
|
|
|
#define OD_FLAT_QM 0
|
|
#define OD_HVS_QM 1
|
|
|
|
# define OD_NSB_ADAPT_CTXS (4)
|
|
|
|
# define OD_ADAPT_K_Q8 0
|
|
# define OD_ADAPT_SUM_EX_Q8 1
|
|
# define OD_ADAPT_COUNT_Q8 2
|
|
# define OD_ADAPT_COUNT_EX_Q8 3
|
|
|
|
# define OD_ADAPT_NO_VALUE (-2147483647-1)
|
|
|
|
typedef enum {
|
|
PVQ_SKIP = 0x0,
|
|
DC_CODED = 0x1,
|
|
AC_CODED = 0x2,
|
|
AC_DC_CODED = 0x3,
|
|
} PVQ_SKIP_TYPE;
|
|
|
|
typedef struct od_pvq_adapt_ctx od_pvq_adapt_ctx;
|
|
typedef struct od_pvq_codeword_ctx od_pvq_codeword_ctx;
|
|
|
|
struct od_pvq_codeword_ctx {
|
|
int pvq_adapt[2*OD_TXSIZES*OD_NSB_ADAPT_CTXS];
|
|
int pvq_k1_increment;
|
|
/* CDFs are size 16 despite the fact that we're using less than that. */
|
|
uint16_t pvq_k1_cdf[12][16];
|
|
uint16_t pvq_split_cdf[22*7][8];
|
|
int pvq_split_increment;
|
|
};
|
|
|
|
struct od_pvq_adapt_ctx {
|
|
od_pvq_codeword_ctx pvq_codeword_ctx;
|
|
generic_encoder pvq_param_model[3];
|
|
int pvq_ext[OD_TXSIZES*PVQ_MAX_PARTITIONS];
|
|
int pvq_exg[OD_NPLANES_MAX][OD_TXSIZES][PVQ_MAX_PARTITIONS];
|
|
int pvq_gaintheta_increment;
|
|
uint16_t pvq_gaintheta_cdf[2*OD_TXSIZES*PVQ_MAX_PARTITIONS][16];
|
|
int pvq_skip_dir_increment;
|
|
uint16_t pvq_skip_dir_cdf[2*(OD_TXSIZES-1)][7];
|
|
};
|
|
|
|
typedef struct od_qm_entry {
|
|
int interp_q;
|
|
int scale_q8;
|
|
const unsigned char *qm_q4;
|
|
} od_qm_entry;
|
|
|
|
extern const od_qm_entry OD_DEFAULT_QMS[2][2][OD_NPLANES_MAX];
|
|
|
|
void od_adapt_pvq_ctx_reset(od_pvq_adapt_ctx *state, int is_keyframe);
|
|
int od_pvq_size_ctx(int n);
|
|
int od_pvq_k1_ctx(int n, int orig_size);
|
|
|
|
od_val16 od_pvq_sin(od_val32 x);
|
|
od_val16 od_pvq_cos(od_val32 x);
|
|
#if !defined(OD_FLOAT_PVQ)
|
|
int od_vector_log_mag(const od_coeff *x, int n);
|
|
#endif
|
|
|
|
void od_interp_qm(unsigned char *out, int q, const od_qm_entry *entry1,
|
|
const od_qm_entry *entry2);
|
|
|
|
int od_qm_get_index(int bs, int band);
|
|
|
|
extern const od_val16 *const OD_PVQ_BETA[2][OD_NPLANES_MAX][OD_TXSIZES + 1];
|
|
|
|
void od_init_qm(int16_t *x, int16_t *x_inv, const int *qm);
|
|
int od_compute_householder(od_val16 *r, int n, od_val32 gr, int *sign,
|
|
int shift);
|
|
void od_apply_householder(od_val16 *out, const od_val16 *x, const od_val16 *r,
|
|
int n);
|
|
void od_pvq_synthesis_partial(od_coeff *xcoeff, const od_coeff *ypulse,
|
|
const od_val16 *r, int n,
|
|
int noref, od_val32 g,
|
|
od_val32 theta, int m, int s,
|
|
const int16_t *qm_inv);
|
|
od_val32 od_gain_expand(od_val32 cg, int q0, od_val16 beta);
|
|
od_val32 od_pvq_compute_gain(const od_val16 *x, int n, int q0, od_val32 *g,
|
|
od_val16 beta, int bshift);
|
|
int od_pvq_compute_max_theta(od_val32 qcg, od_val16 beta);
|
|
od_val32 od_pvq_compute_theta(int t, int max_theta);
|
|
int od_pvq_compute_k(od_val32 qcg, int itheta, od_val32 theta, int noref,
|
|
int n, od_val16 beta, int nodesync);
|
|
|
|
int od_vector_is_null(const od_coeff *x, int len);
|
|
int od_qm_offset(int bs, int xydec);
|
|
|
|
#endif
|