2015-08-06 05:00:31 +03:00
|
|
|
/*
|
2016-07-29 01:51:12 +03:00
|
|
|
* Copyright (c) 2016, Alliance for Open Media. All rights reserved
|
2015-08-06 05:00:31 +03:00
|
|
|
*
|
2016-07-29 01:51:12 +03:00
|
|
|
* This source code is subject to the terms of the BSD 2 Clause License and
|
|
|
|
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
|
|
|
|
* was not distributed with this source code in the LICENSE file, you can
|
|
|
|
* obtain it at www.aomedia.org/license/software. If the Alliance for Open
|
|
|
|
* Media Patent License 1.0 was not distributed with this source code in the
|
|
|
|
* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
|
2015-08-06 05:00:31 +03:00
|
|
|
*/
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
#ifndef AV1_ENCODER_ENCODER_H_
|
|
|
|
#define AV1_ENCODER_ENCODER_H_
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
#include <stdio.h>
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
#include "./aom_config.h"
|
|
|
|
#include "aom/aomcx.h"
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-23 02:08:15 +03:00
|
|
|
#include "av1/common/alloccommon.h"
|
|
|
|
#include "av1/common/entropymode.h"
|
|
|
|
#include "av1/common/thread_common.h"
|
|
|
|
#include "av1/common/onyxc_int.h"
|
|
|
|
#include "av1/encoder/aq_cyclicrefresh.h"
|
2016-04-14 00:53:34 +03:00
|
|
|
#if CONFIG_ANS
|
2016-09-18 01:11:16 +03:00
|
|
|
#include "aom_dsp/buf_ans.h"
|
2016-04-14 00:53:34 +03:00
|
|
|
#endif
|
2016-08-23 02:08:15 +03:00
|
|
|
#include "av1/encoder/context_tree.h"
|
|
|
|
#include "av1/encoder/encodemb.h"
|
|
|
|
#include "av1/encoder/firstpass.h"
|
|
|
|
#include "av1/encoder/lookahead.h"
|
|
|
|
#include "av1/encoder/mbgraph.h"
|
|
|
|
#include "av1/encoder/mcomp.h"
|
|
|
|
#include "av1/encoder/quantize.h"
|
|
|
|
#include "av1/encoder/ratectrl.h"
|
|
|
|
#include "av1/encoder/rd.h"
|
|
|
|
#include "av1/encoder/speed_features.h"
|
|
|
|
#include "av1/encoder/tokenize.h"
|
|
|
|
#include "av1/encoder/variance_tree.h"
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2015-08-12 08:21:38 +03:00
|
|
|
#if CONFIG_INTERNAL_STATS
|
2016-08-23 02:08:15 +03:00
|
|
|
#include "aom_dsp/ssim.h"
|
2015-08-12 08:21:38 +03:00
|
|
|
#endif
|
2016-08-23 02:08:15 +03:00
|
|
|
#include "aom_dsp/variance.h"
|
2016-08-31 00:01:10 +03:00
|
|
|
#include "aom/internal/aom_codec_internal.h"
|
|
|
|
#include "aom_util/aom_thread.h"
|
2015-08-12 08:21:38 +03:00
|
|
|
|
2015-08-06 05:00:31 +03:00
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
int nmvjointcost[MV_JOINTS];
|
|
|
|
int nmvcosts[2][MV_VALS];
|
|
|
|
int nmvcosts_hp[2][MV_VALS];
|
|
|
|
|
2016-02-19 21:41:04 +03:00
|
|
|
#if CONFIG_REF_MV
|
|
|
|
int nmv_vec_cost[NMV_CONTEXTS][MV_JOINTS];
|
|
|
|
int nmv_costs[NMV_CONTEXTS][2][MV_VALS];
|
|
|
|
int nmv_costs_hp[NMV_CONTEXTS][2][MV_VALS];
|
|
|
|
#endif
|
|
|
|
|
2015-08-06 05:00:31 +03:00
|
|
|
// 0 = Intra, Last, GF, ARF
|
Code refactoring on Macros related to ref frame numbers
We have renamed following Macros to avoid name confusion:
REFS_PER_FRAME --> INTER_REFS_PER_FRAME
(= ALTREF_FRAME - LAST_FRAME + 1)
MAX_REF_FRAMES --> TOTAL_REFS_PER_FRAME
(= ALTREF_FRAME - INTRA_FRAME + 1)
INTER_REFS_PER_FRAME specifies the maximum number of reference frames
that each Inter frame may use.
TOTAL_REFS_PER_FRAME is equal to INTER_REFS_PER_FRAME + 1, which
counts the INTRA_FRAME.
Further, at the encoder side, since REF_FRAMES specifies the maximum
number of the reference frames that the encoder may store, REF_FRAMES
is usually larger than INTER_REFS_PER_FRAME. For example, in the
ext-refs experiment, REF_FRAMES == 8, which allows the encoder to
store maximum 8 reference frames in the buffer, but
INTER_REFS_PER_FRAME equals to 6, which allows each Inter frame may
use up to 6 frames out of the 8 buffered frames as its references.
Hence, in order to explore the possibility to store more reference
frames in future patches, we modified a couple of array sizes to
accomodate the case that the number of buffered reference frames is
not always equal to the number of the references that are being used
by each Inter frame.
Change-Id: I19e42ef608946cc76ebfd3e965a05f4b9b93a0b3
2016-08-04 00:46:43 +03:00
|
|
|
signed char last_ref_lf_deltas[TOTAL_REFS_PER_FRAME];
|
2015-08-06 05:00:31 +03:00
|
|
|
// 0 = ZERO_MV, MV
|
|
|
|
signed char last_mode_lf_deltas[MAX_MODE_LF_DELTAS];
|
|
|
|
|
|
|
|
FRAME_CONTEXT fc;
|
|
|
|
} CODING_CONTEXT;
|
|
|
|
|
2016-07-27 19:12:53 +03:00
|
|
|
// Enumerates frame kinds with explicit, stable numeric values.
// NOTE(review): the type name suggests these values select which stored
// frame context to use -- confirm against the users of this enum.
// The last two enumerators exist only when CONFIG_EXT_REFS is enabled.
typedef enum {
  // regular inter frame
  REGULAR_FRAME = 0,
  // alternate reference frame
  ARF_FRAME = 1,
  // overlay frame
  OVERLAY_FRAME = 2,
  // golden frame
  GLD_FRAME = 3,
#if CONFIG_EXT_REFS
  // backward reference frame
  BRF_FRAME = 4,
  // extra alternate reference frame
  EXT_ARF_FRAME = 5
#endif
} FRAME_CONTEXT_INDEX;
|
|
|
|
|
2015-08-06 05:00:31 +03:00
|
|
|
// Scaling selector with explicit values 0..3.
// NOTE(review): the enumerator names suggest the ratios 1:1, 4:5, 3:5 and
// 1:2 respectively -- confirm against the code that interprets them.
typedef enum {
  NORMAL = 0,
  FOURFIVE = 1,
  THREEFIVE = 2,
  ONETWO = 3
} AOM_SCALING;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
// Encoder operating mode. Values are implicit: GOOD = 0, BEST = 1,
// REALTIME = 2.
typedef enum {
  // Good Quality Fast Encoding. The encoder balances quality with the amount of
  // time it takes to encode the output. Speed setting controls how fast.
  GOOD,

  // The encoder places priority on the quality of the output over encoding
  // speed. The output is compressed at the highest possible quality. This
  // option takes the longest amount of time to encode. Speed setting ignored.
  BEST,

  // Realtime/Live Encoding. This mode is optimized for realtime encoding (for
  // example, capturing a television signal or feed from a live camera). Speed
  // setting controls how fast.
  REALTIME
} MODE;
|
|
|
|
|
|
|
|
// Single-bit flags, one per frame type, so that several can be OR-ed
// together. The bit used by FRAMEFLAGS_ALTREF depends on the build: with
// CONFIG_EXT_REFS, FRAMEFLAGS_BWDREF takes bit 2 and FRAMEFLAGS_ALTREF moves
// to bit 3; otherwise FRAMEFLAGS_ALTREF is bit 2 and FRAMEFLAGS_BWDREF does
// not exist.
typedef enum {
  FRAMEFLAGS_KEY = 1 << 0,
  FRAMEFLAGS_GOLDEN = 1 << 1,
#if CONFIG_EXT_REFS
  FRAMEFLAGS_BWDREF = 1 << 2,
  FRAMEFLAGS_ALTREF = 1 << 3,
#else
  FRAMEFLAGS_ALTREF = 1 << 2,
#endif  // CONFIG_EXT_REFS
} FRAMETYPE_FLAGS;
|
|
|
|
|
|
|
|
// Adaptive Quantization mode selector. DELTA_AQ is only present when
// CONFIG_DELTA_Q is enabled; AQ_MODE_COUNT therefore evaluates to 4 or 5
// depending on the build.
typedef enum {
  NO_AQ = 0,
  VARIANCE_AQ = 1,
  COMPLEXITY_AQ = 2,
  CYCLIC_REFRESH_AQ = 3,
#if CONFIG_DELTA_Q
  DELTA_AQ = 4,
#endif
  AQ_MODE_COUNT  // This should always be the last member of the enum
} AQ_MODE;
|
|
|
|
|
|
|
|
// Frame resizing policy.
typedef enum {
  RESIZE_NONE = 0,    // No frame resizing allowed.
  RESIZE_FIXED = 1,   // All frames are coded at the specified dimension.
  RESIZE_DYNAMIC = 2  // Coded size of each frame is determined by the codec.
} RESIZE_TYPE;
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
typedef struct AV1EncoderConfig {
|
2015-08-06 05:00:31 +03:00
|
|
|
BITSTREAM_PROFILE profile;
|
2016-08-31 00:01:10 +03:00
|
|
|
aom_bit_depth_t bit_depth; // Codec bit-depth.
|
2016-08-12 06:13:14 +03:00
|
|
|
int width; // width of data passed to the compressor
|
|
|
|
int height; // height of data passed to the compressor
|
2015-08-06 05:00:31 +03:00
|
|
|
unsigned int input_bit_depth; // Input bit depth.
|
2016-08-12 06:13:14 +03:00
|
|
|
double init_framerate; // set to passed in framerate
|
|
|
|
int64_t target_bandwidth; // bandwidth to be used in bits per second
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
int noise_sensitivity; // pre processing blur: recommendation 0
|
2016-08-12 06:13:14 +03:00
|
|
|
int sharpness; // sharpening output: recommendation 0:
|
2015-08-06 05:00:31 +03:00
|
|
|
int speed;
|
|
|
|
// maximum allowed bitrate for any intra frame in % of bitrate target.
|
|
|
|
unsigned int rc_max_intra_bitrate_pct;
|
|
|
|
// maximum allowed bitrate for any inter frame in % of bitrate target.
|
|
|
|
unsigned int rc_max_inter_bitrate_pct;
|
|
|
|
// percent of rate boost for golden frame in CBR mode.
|
|
|
|
unsigned int gf_cbr_boost_pct;
|
|
|
|
|
|
|
|
MODE mode;
|
|
|
|
int pass;
|
|
|
|
|
|
|
|
// Key Framing Operations
|
|
|
|
int auto_key; // autodetect cut scenes and set the keyframes
|
|
|
|
int key_freq; // maximum distance to key frame.
|
|
|
|
|
|
|
|
int lag_in_frames; // how many frames lag before we start encoding
|
|
|
|
|
|
|
|
// ----------------------------------------------------------------
|
|
|
|
// DATARATE CONTROL OPTIONS
|
|
|
|
|
|
|
|
// vbr, cbr, constrained quality or constant quality
|
2016-08-31 00:01:10 +03:00
|
|
|
enum aom_rc_mode rc_mode;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
// buffer targeting aggressiveness
|
|
|
|
int under_shoot_pct;
|
|
|
|
int over_shoot_pct;
|
|
|
|
|
|
|
|
// buffering parameters
|
|
|
|
int64_t starting_buffer_level_ms;
|
|
|
|
int64_t optimal_buffer_level_ms;
|
|
|
|
int64_t maximum_buffer_size_ms;
|
|
|
|
|
|
|
|
// Frame drop threshold.
|
|
|
|
int drop_frames_water_mark;
|
|
|
|
|
|
|
|
// controlling quality
|
|
|
|
int fixed_q;
|
|
|
|
int worst_allowed_q;
|
|
|
|
int best_allowed_q;
|
|
|
|
int cq_level;
|
|
|
|
AQ_MODE aq_mode; // Adaptive Quantization mode
|
2016-08-11 19:39:47 +03:00
|
|
|
#if CONFIG_AOM_QM
|
|
|
|
int using_qm;
|
|
|
|
int qm_minlevel;
|
|
|
|
int qm_maxlevel;
|
|
|
|
#endif
|
2016-11-09 17:04:18 +03:00
|
|
|
#if CONFIG_TILE_GROUPS
|
|
|
|
unsigned int num_tile_groups;
|
|
|
|
unsigned int mtu;
|
|
|
|
#endif
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
// Internal frame size scaling.
|
|
|
|
RESIZE_TYPE resize_mode;
|
|
|
|
int scaled_frame_width;
|
|
|
|
int scaled_frame_height;
|
|
|
|
|
|
|
|
// Enable feature to reduce the frame quantization every x frames.
|
|
|
|
int frame_periodic_boost;
|
|
|
|
|
|
|
|
// two pass datarate control
|
2016-08-12 06:13:14 +03:00
|
|
|
int two_pass_vbrbias; // two pass datarate control tweaks
|
2015-08-06 05:00:31 +03:00
|
|
|
int two_pass_vbrmin_section;
|
|
|
|
int two_pass_vbrmax_section;
|
|
|
|
// END DATARATE CONTROL OPTIONS
|
|
|
|
// ----------------------------------------------------------------
|
|
|
|
|
|
|
|
int enable_auto_arf;
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
2016-02-04 20:47:46 +03:00
|
|
|
int enable_auto_brf; // (b)ackward (r)ef (f)rame
|
2016-08-12 06:13:14 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
/* Bitfield defining the error resiliency features to enable.
|
|
|
|
* Can provide decodable frames after losses in previous
|
|
|
|
* frames and decodable partitions after losses in the same frame.
|
|
|
|
*/
|
|
|
|
unsigned int error_resilient_mode;
|
|
|
|
|
|
|
|
/* Bitfield defining the parallel decoding mode where the
|
|
|
|
* decoding in successive frames may be conducted in parallel
|
|
|
|
* just by decoding the frame headers.
|
|
|
|
*/
|
|
|
|
unsigned int frame_parallel_decoding_mode;
|
|
|
|
|
|
|
|
int arnr_max_frames;
|
|
|
|
int arnr_strength;
|
|
|
|
|
|
|
|
int min_gf_interval;
|
|
|
|
int max_gf_interval;
|
|
|
|
|
|
|
|
int tile_columns;
|
|
|
|
int tile_rows;
|
2016-12-09 08:08:31 +03:00
|
|
|
#if CONFIG_DEBLOCKING_ACROSS_TILES
|
|
|
|
int loop_filter_across_tiles_enabled;
|
|
|
|
#endif // CONFIG_DEBLOCKING_ACROSS_TILES
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
int max_threads;
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
aom_fixed_buf_t two_pass_stats_in;
|
|
|
|
struct aom_codec_pkt_list *output_pkt_list;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
#if CONFIG_FP_MB_STATS
|
2016-08-31 00:01:10 +03:00
|
|
|
aom_fixed_buf_t firstpass_mb_stats_in;
|
2015-08-06 05:00:31 +03:00
|
|
|
#endif
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
aom_tune_metric tuning;
|
|
|
|
aom_tune_content content;
|
|
|
|
#if CONFIG_AOM_HIGHBITDEPTH
|
2015-08-06 05:00:31 +03:00
|
|
|
int use_highbitdepth;
|
|
|
|
#endif
|
2016-08-31 00:01:10 +03:00
|
|
|
aom_color_space_t color_space;
|
2015-09-16 04:56:51 +03:00
|
|
|
int color_range;
|
2015-09-29 01:55:46 +03:00
|
|
|
int render_width;
|
|
|
|
int render_height;
|
Make superblock size variable at the frame level.
The uncompressed frame header contains a bit to signal whether the
frame is encoded using 64x64 or 128x128 superblocks. This can vary
between any 2 frames.
vpxenc gained the --sb-size={64,128,dynamic} option, which allows the
configuration of the superblock size used (default is dynamic). 64/128
will force the encoder to always use the specified superblock size.
Dynamic would enable the encoder to choose the sb size for each
frame, but this is not implemented yet (dynamic does the same as 128
for now).
Constraints on tile sizes depend on the superblock size, the following
is a summary of the current bitstream syntax and semantics:
If both --enable-ext-tile is OFF and --enable-ext-partition is OFF:
The tile coding in this case is the same as VP9. In particular,
tiles have a minimum width of 256 pixels and a maximum width of
4096 pixels. The tile width must be multiples of 64 pixels
(except for the rightmost tile column). There can be a maximum
of 64 tile columns and 4 tile rows.
If --enable-ext-tile is OFF and --enable-ext-partition is ON:
Same constraints as above, except that tile width must be
multiples of 128 pixels (except for the rightmost tile column).
There is no change in the bitstream syntax used for coding the tile
configuration if --enable-ext-tile is OFF.
If --enable-ext-tile is ON and --enable-ext-partition is ON:
This is the new large scale tile coding configuration. The
minimum/maximum tile width and height are 64/4096 pixels. Tile
width and height must be multiples of 64 pixels. The uncompressed
header contains two 6 bit fields that hold the tile width/heigh
in units of 64 pixels. The maximum number of tile rows/columns
is only limited by the maximum frame size of 65536x65536 pixels
that can be coded in the bitstream. This yields a maximum of
1024x1024 tile rows and columns (of 64x64 tiles in a 65536x65536
frame).
If both --enable-ext-tile is ON and --enable-ext-partition is ON:
Same applies as above, except that in the bitstream the 2 fields
containing the tile width/height are in units of the superblock
size, and the superblock size itself is also coded in the bitstream.
If the uncompressed header signals the use of 64x64 superblocks,
then the tile width/height fields are 6 bits wide and are in units
of 64 pixels. If the uncompressed header signals the use of 128x128
superblocks, then the tile width/height fields are 5 bits wide and
are in units of 128 pixels.
The above is a summary of the bitstream. The user interface to vpxenc
(and the equivalent encoder API) behaves a follows:
If --enable-ext-tile is OFF:
No change in the user interface. --tile-columns and --tile-rows
specify the base 2 logarithm of the desired number of tile columns
and tile rows. The actual number of tile rows and tile columns,
and the particular tile width and tile height are computed by the
codec ensuring all of the above constraints are respected.
If --enable-ext-tile is ON, but --enable-ext-partition is OFF:
No change in the user interface. --tile-columns and --tile-rows
specify the WIDTH and HEIGHT of the tiles in unit of 64 pixels.
The valid values are in the range [1, 64] (which corresponds to
[64, 4096] pixels in increments of 64.
If both --enable-ext-tile is ON and --enable-ext-partition is ON:
If --sb-size=64 (default):
The user interface is the same as in the previous point.
--tile-columns and --tile-rows specify tile WIDTH and HEIGHT,
in units of 64 pixels, in the range [1, 64] (which corresponds
to [64, 4096] pixels in increments of 64).
If --sb-size=128 or --sb-size=dynamic:
--tile-columns and --tile-rows specify tile WIDTH and HEIGHT,
in units of 128 pixels in the range [1, 32] (which corresponds
to [128, 4096] pixels in increments of 128).
Change-Id: Idc9beee1ad12ff1634e83671985d14c680f9179a
2016-03-24 16:56:05 +03:00
|
|
|
|
|
|
|
#if CONFIG_EXT_PARTITION
|
2016-08-31 00:01:10 +03:00
|
|
|
aom_superblock_size_t superblock_size;
|
Make superblock size variable at the frame level.
The uncompressed frame header contains a bit to signal whether the
frame is encoded using 64x64 or 128x128 superblocks. This can vary
between any 2 frames.
vpxenc gained the --sb-size={64,128,dynamic} option, which allows the
configuration of the superblock size used (default is dynamic). 64/128
will force the encoder to always use the specified superblock size.
Dynamic would enable the encoder to choose the sb size for each
frame, but this is not implemented yet (dynamic does the same as 128
for now).
Constraints on tile sizes depend on the superblock size, the following
is a summary of the current bitstream syntax and semantics:
If both --enable-ext-tile is OFF and --enable-ext-partition is OFF:
The tile coding in this case is the same as VP9. In particular,
tiles have a minimum width of 256 pixels and a maximum width of
4096 pixels. The tile width must be multiples of 64 pixels
(except for the rightmost tile column). There can be a maximum
of 64 tile columns and 4 tile rows.
If --enable-ext-tile is OFF and --enable-ext-partition is ON:
Same constraints as above, except that tile width must be
multiples of 128 pixels (except for the rightmost tile column).
There is no change in the bitstream syntax used for coding the tile
configuration if --enable-ext-tile is OFF.
If --enable-ext-tile is ON and --enable-ext-partition is ON:
This is the new large scale tile coding configuration. The
minimum/maximum tile width and height are 64/4096 pixels. Tile
width and height must be multiples of 64 pixels. The uncompressed
header contains two 6 bit fields that hold the tile width/heigh
in units of 64 pixels. The maximum number of tile rows/columns
is only limited by the maximum frame size of 65536x65536 pixels
that can be coded in the bitstream. This yields a maximum of
1024x1024 tile rows and columns (of 64x64 tiles in a 65536x65536
frame).
If both --enable-ext-tile is ON and --enable-ext-partition is ON:
Same applies as above, except that in the bitstream the 2 fields
containing the tile width/height are in units of the superblock
size, and the superblock size itself is also coded in the bitstream.
If the uncompressed header signals the use of 64x64 superblocks,
then the tile width/height fields are 6 bits wide and are in units
of 64 pixels. If the uncompressed header signals the use of 128x128
superblocks, then the tile width/height fields are 5 bits wide and
are in units of 128 pixels.
The above is a summary of the bitstream. The user interface to vpxenc
(and the equivalent encoder API) behaves a follows:
If --enable-ext-tile is OFF:
No change in the user interface. --tile-columns and --tile-rows
specify the base 2 logarithm of the desired number of tile columns
and tile rows. The actual number of tile rows and tile columns,
and the particular tile width and tile height are computed by the
codec ensuring all of the above constraints are respected.
If --enable-ext-tile is ON, but --enable-ext-partition is OFF:
No change in the user interface. --tile-columns and --tile-rows
specify the WIDTH and HEIGHT of the tiles in unit of 64 pixels.
The valid values are in the range [1, 64] (which corresponds to
[64, 4096] pixels in increments of 64.
If both --enable-ext-tile is ON and --enable-ext-partition is ON:
If --sb-size=64 (default):
The user interface is the same as in the previous point.
--tile-columns and --tile-rows specify tile WIDTH and HEIGHT,
in units of 64 pixels, in the range [1, 64] (which corresponds
to [64, 4096] pixels in increments of 64).
If --sb-size=128 or --sb-size=dynamic:
--tile-columns and --tile-rows specify tile WIDTH and HEIGHT,
in units of 128 pixels in the range [1, 32] (which corresponds
to [128, 4096] pixels in increments of 128).
Change-Id: Idc9beee1ad12ff1634e83671985d14c680f9179a
2016-03-24 16:56:05 +03:00
|
|
|
#endif // CONFIG_EXT_PARTITION
|
2016-08-31 00:01:10 +03:00
|
|
|
} AV1EncoderConfig;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
static INLINE int is_lossless_requested(const AV1EncoderConfig *cfg) {
|
2015-08-06 05:00:31 +03:00
|
|
|
return cfg->best_allowed_q == 0 && cfg->worst_allowed_q == 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// TODO(jingning) All spatially adaptive variables should go to TileDataEnc.
|
|
|
|
typedef struct TileDataEnc {
|
|
|
|
TileInfo tile_info;
|
|
|
|
int thresh_freq_fact[BLOCK_SIZES][MAX_MODES];
|
|
|
|
int mode_map[BLOCK_SIZES][MAX_MODES];
|
2016-10-26 01:15:23 +03:00
|
|
|
int m_search_count;
|
|
|
|
int ex_search_count;
|
2016-11-05 02:36:56 +03:00
|
|
|
#if CONFIG_PVQ
|
|
|
|
PVQ_QUEUE pvq_q;
|
|
|
|
#endif
|
2015-08-06 05:00:31 +03:00
|
|
|
} TileDataEnc;
|
|
|
|
|
|
|
|
typedef struct RD_COUNTS {
|
2016-08-31 00:01:10 +03:00
|
|
|
av1_coeff_count coef_counts[TX_SIZES][PLANE_TYPES];
|
2015-08-06 05:00:31 +03:00
|
|
|
int64_t comp_pred_diff[REFERENCE_MODES];
|
|
|
|
} RD_COUNTS;
|
|
|
|
|
|
|
|
typedef struct ThreadData {
|
|
|
|
MACROBLOCK mb;
|
|
|
|
RD_COUNTS rd_counts;
|
|
|
|
FRAME_COUNTS *counts;
|
|
|
|
|
|
|
|
PICK_MODE_CONTEXT *leaf_tree;
|
|
|
|
PC_TREE *pc_tree;
|
2016-04-08 17:15:06 +03:00
|
|
|
PC_TREE *pc_root[MAX_MIB_SIZE_LOG2 - MIN_MIB_SIZE_LOG2 + 1];
|
2016-04-11 19:41:58 +03:00
|
|
|
|
|
|
|
VAR_TREE *var_tree;
|
|
|
|
VAR_TREE *var_root[MAX_MIB_SIZE_LOG2 - MIN_MIB_SIZE_LOG2 + 1];
|
2015-08-06 05:00:31 +03:00
|
|
|
} ThreadData;
|
|
|
|
|
|
|
|
// Forward declaration only: introduces the struct tag so pointers to it can
// be declared here; the full definition is not part of this section.
struct EncWorkerData;
|
|
|
|
|
|
|
|
// An "active map": two integer flags plus a pointer to a byte array.
// NOTE(review): presumably `map` holds one byte per block and `update`
// signals that it changed -- confirm against the code that consumes it.
// This struct does not record the length of `map`.
typedef struct ActiveMap {
  int enabled;
  int update;
  unsigned char *map;
} ActiveMap;
|
|
|
|
|
2016-10-18 02:38:05 +03:00
|
|
|
#define NUM_STAT_TYPES 4  // types of stats: Y, U, V and ALL

// Per-image statistics: one value for each of Y, U, V and ALL, plus a
// separate `worst` value.
// NOTE(review): `worst` presumably tracks the worst value observed so far
// -- confirm against the code that updates it.
typedef struct IMAGE_STAT {
  double stat[NUM_STAT_TYPES];
  double worst;
} ImageStat;

// The macro is only needed to size the array above; keep it out of the
// namespace of files that include this header.
#undef NUM_STAT_TYPES
|
|
|
|
|
2016-02-17 01:33:18 +03:00
|
|
|
typedef struct {
|
|
|
|
int ref_count;
|
|
|
|
YV12_BUFFER_CONFIG buf;
|
|
|
|
} EncRefCntBuffer;
|
|
|
|
|
2016-01-08 01:29:26 +03:00
|
|
|
#if CONFIG_ENTROPY
// Coefficient statistics kept in COEF_PROBS_BUFS parallel buffers
// (probabilities, counts and end-of-block counts), plus one extra set of
// starting probabilities. Only compiled in CONFIG_ENTROPY builds.
typedef struct SUBFRAME_STATS {
  av1_coeff_probs_model coef_probs_buf[COEF_PROBS_BUFS][TX_SIZES][PLANE_TYPES];
  av1_coeff_count coef_counts_buf[COEF_PROBS_BUFS][TX_SIZES][PLANE_TYPES];
  unsigned int eob_counts_buf[COEF_PROBS_BUFS][TX_SIZES][PLANE_TYPES][REF_TYPES]
                             [COEF_BANDS][COEFF_CONTEXTS];
  av1_coeff_probs_model enc_starting_coef_probs[TX_SIZES][PLANE_TYPES];
} SUBFRAME_STATS;
#endif  // CONFIG_ENTROPY
|
|
|
|
|
2016-03-11 20:42:49 +03:00
|
|
|
// A (pointer, size) pair describing a tile's byte buffer.
// NOTE(review): `size` is presumably the number of bytes at `data`, and
// ownership of the memory is not expressed here -- confirm with the writer.
typedef struct TileBufferEnc {
  uint8_t *data;
  size_t size;
} TileBufferEnc;
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
typedef struct AV1_COMP {
|
2015-08-06 05:00:31 +03:00
|
|
|
QUANTS quants;
|
|
|
|
ThreadData td;
|
|
|
|
MB_MODE_INFO_EXT *mbmi_ext_base;
|
2016-03-07 16:46:39 +03:00
|
|
|
DECLARE_ALIGNED(16, int16_t, y_dequant[QINDEX_RANGE][8]); // 8: SIMD width
|
|
|
|
DECLARE_ALIGNED(16, int16_t, uv_dequant[QINDEX_RANGE][8]); // 8: SIMD width
|
2016-05-11 01:32:42 +03:00
|
|
|
#if CONFIG_NEW_QUANT
|
|
|
|
DECLARE_ALIGNED(16, dequant_val_type_nuq,
|
2016-06-11 01:29:10 +03:00
|
|
|
y_dequant_val_nuq[QUANT_PROFILES][QINDEX_RANGE][COEF_BANDS]);
|
2016-05-11 01:32:42 +03:00
|
|
|
DECLARE_ALIGNED(16, dequant_val_type_nuq,
|
2016-06-11 01:29:10 +03:00
|
|
|
uv_dequant_val_nuq[QUANT_PROFILES][QINDEX_RANGE][COEF_BANDS]);
|
2016-05-11 01:32:42 +03:00
|
|
|
#endif // CONFIG_NEW_QUANT
|
2016-08-31 00:01:10 +03:00
|
|
|
AV1_COMMON common;
|
|
|
|
AV1EncoderConfig oxcf;
|
2016-08-12 06:13:14 +03:00
|
|
|
struct lookahead_ctx *lookahead;
|
|
|
|
struct lookahead_entry *alt_ref_source;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
YV12_BUFFER_CONFIG *Source;
|
|
|
|
YV12_BUFFER_CONFIG *Last_Source; // NULL for first frame and alt_ref frames
|
|
|
|
YV12_BUFFER_CONFIG *un_scaled_source;
|
|
|
|
YV12_BUFFER_CONFIG scaled_source;
|
|
|
|
YV12_BUFFER_CONFIG *unscaled_last_source;
|
|
|
|
YV12_BUFFER_CONFIG scaled_last_source;
|
|
|
|
|
2016-02-17 01:33:18 +03:00
|
|
|
// Up-sampled reference buffers
|
Code refactoring on Macros related to ref frame numbers
We have renamed following Macros to avoid name confusion:
REFS_PER_FRAME --> INTER_REFS_PER_FRAME
(= ALTREF_FRAME - LAST_FRAME + 1)
MAX_REF_FRAMES --> TOTAL_REFS_PER_FRAME
(= ALTREF_FRAME - INTRA_FRAME + 1)
INTER_REFS_PER_FRAME specifies the maximum number of reference frames
that each Inter frame may use.
TOTAL_REFS_PER_FRAME is equal to INTER_REFS_PER_FRAME + 1, which
counts the INTRA_FRAME.
Further, at the encoder side, since REF_FRAMES specifies the maximum
number of the reference frames that the encoder may store, REF_FRAMES
is usually larger than INTER_REFS_PER_FRAME. For example, in the
ext-refs experiment, REF_FRAMES == 8, which allows the encoder to
store maximum 8 reference frames in the buffer, but
INTER_REFS_PER_FRAME equals to 6, which allows each Inter frame may
use up to 6 frames out of the 8 buffered frames as its references.
Hence, in order to explore the possibility to store more reference
frames in future patches, we modified a couple of array sizes to
accomodate the case that the number of buffered reference frames is
not always equal to the number of the references that are being used
by each Inter frame.
Change-Id: I19e42ef608946cc76ebfd3e965a05f4b9b93a0b3
2016-08-04 00:46:43 +03:00
|
|
|
// NOTE(zoeliu): It is needed to allocate sufficient space to the up-sampled
|
|
|
|
// reference buffers, which should include the up-sampled version of all the
|
|
|
|
// possibly stored references plus the currently coded frame itself.
|
|
|
|
EncRefCntBuffer upsampled_ref_bufs[REF_FRAMES + 1];
|
|
|
|
int upsampled_ref_idx[REF_FRAMES + 1];
|
2016-02-17 01:33:18 +03:00
|
|
|
|
2015-08-06 05:00:31 +03:00
|
|
|
// For a still frame, this flag is set to 1 to skip partition search.
|
|
|
|
int partition_search_skippable_frame;
|
|
|
|
|
Code refactoring on Macros related to ref frame numbers
We have renamed following Macros to avoid name confusion:
REFS_PER_FRAME --> INTER_REFS_PER_FRAME
(= ALTREF_FRAME - LAST_FRAME + 1)
MAX_REF_FRAMES --> TOTAL_REFS_PER_FRAME
(= ALTREF_FRAME - INTRA_FRAME + 1)
INTER_REFS_PER_FRAME specifies the maximum number of reference frames
that each Inter frame may use.
TOTAL_REFS_PER_FRAME is equal to INTER_REFS_PER_FRAME + 1, which
counts the INTRA_FRAME.
Further, at the encoder side, since REF_FRAMES specifies the maximum
number of the reference frames that the encoder may store, REF_FRAMES
is usually larger than INTER_REFS_PER_FRAME. For example, in the
ext-refs experiment, REF_FRAMES == 8, which allows the encoder to
store maximum 8 reference frames in the buffer, but
INTER_REFS_PER_FRAME equals to 6, which allows each Inter frame may
use up to 6 frames out of the 8 buffered frames as its references.
Hence, in order to explore the possibility to store more reference
frames in future patches, we modified a couple of array sizes to
accomodate the case that the number of buffered reference frames is
not always equal to the number of the references that are being used
by each Inter frame.
Change-Id: I19e42ef608946cc76ebfd3e965a05f4b9b93a0b3
2016-08-04 00:46:43 +03:00
|
|
|
int scaled_ref_idx[TOTAL_REFS_PER_FRAME];
|
2015-11-12 13:12:17 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
2015-12-03 03:27:46 +03:00
|
|
|
int lst_fb_idxes[LAST_REF_FRAMES];
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#else
|
2015-12-03 03:27:46 +03:00
|
|
|
int lst_fb_idx;
|
2015-11-12 13:12:17 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2015-08-06 05:00:31 +03:00
|
|
|
int gld_fb_idx;
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
2016-02-04 20:47:46 +03:00
|
|
|
int bwd_fb_idx; // BWD_REF_FRAME
|
2016-08-12 06:13:14 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2015-08-06 05:00:31 +03:00
|
|
|
int alt_fb_idx;
|
|
|
|
|
2016-05-20 02:46:10 +03:00
|
|
|
int last_show_frame_buf_idx; // last show frame buffer index
|
|
|
|
|
2015-12-03 03:27:46 +03:00
|
|
|
int refresh_last_frame;
|
2015-08-06 05:00:31 +03:00
|
|
|
int refresh_golden_frame;
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
2016-02-04 20:47:46 +03:00
|
|
|
int refresh_bwd_ref_frame;
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2015-08-06 05:00:31 +03:00
|
|
|
int refresh_alt_ref_frame;
|
|
|
|
|
|
|
|
int ext_refresh_frame_flags_pending;
|
2015-12-03 03:27:46 +03:00
|
|
|
int ext_refresh_last_frame;
|
2015-08-06 05:00:31 +03:00
|
|
|
int ext_refresh_golden_frame;
|
|
|
|
int ext_refresh_alt_ref_frame;
|
|
|
|
|
|
|
|
int ext_refresh_frame_context_pending;
|
|
|
|
int ext_refresh_frame_context;
|
|
|
|
|
|
|
|
YV12_BUFFER_CONFIG last_frame_uf;
|
2016-01-20 00:01:01 +03:00
|
|
|
#if CONFIG_LOOP_RESTORATION
|
|
|
|
YV12_BUFFER_CONFIG last_frame_db;
|
2016-12-16 00:23:21 +03:00
|
|
|
YV12_BUFFER_CONFIG trial_frame_rst;
|
2017-01-04 02:14:57 +03:00
|
|
|
uint8_t *extra_rstbuf; // Extra buffers used in restoration search
|
|
|
|
RestorationInfo rst_search[MAX_MB_PLANE]; // Used for encoder side search
|
|
|
|
#endif // CONFIG_LOOP_RESTORATION
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
// Ambient reconstruction err target for force key frames
|
|
|
|
int64_t ambient_err;
|
|
|
|
|
|
|
|
RD_OPT rd;
|
|
|
|
|
|
|
|
CODING_CONTEXT coding_context;
|
|
|
|
|
2016-02-19 21:41:04 +03:00
|
|
|
#if CONFIG_REF_MV
|
2016-07-25 23:38:49 +03:00
|
|
|
int nmv_costs[NMV_CONTEXTS][2][MV_VALS];
|
|
|
|
int nmv_costs_hp[NMV_CONTEXTS][2][MV_VALS];
|
2016-02-19 21:41:04 +03:00
|
|
|
#endif
|
|
|
|
|
2016-07-25 23:38:49 +03:00
|
|
|
int nmvcosts[2][MV_VALS];
|
|
|
|
int nmvcosts_hp[2][MV_VALS];
|
|
|
|
int nmvsadcosts[2][MV_VALS];
|
|
|
|
int nmvsadcosts_hp[2][MV_VALS];
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
int64_t last_time_stamp_seen;
|
|
|
|
int64_t last_end_time_stamp_seen;
|
|
|
|
int64_t first_time_stamp_ever;
|
|
|
|
|
|
|
|
RATE_CONTROL rc;
|
|
|
|
double framerate;
|
|
|
|
|
Code refactoring on Macros related to ref frame numbers
We have renamed following Macros to avoid name confusion:
REFS_PER_FRAME --> INTER_REFS_PER_FRAME
(= ALTREF_FRAME - LAST_FRAME + 1)
MAX_REF_FRAMES --> TOTAL_REFS_PER_FRAME
(= ALTREF_FRAME - INTRA_FRAME + 1)
INTER_REFS_PER_FRAME specifies the maximum number of reference frames
that each Inter frame may use.
TOTAL_REFS_PER_FRAME is equal to INTER_REFS_PER_FRAME + 1, which
counts the INTRA_FRAME.
Further, at the encoder side, since REF_FRAMES specifies the maximum
number of the reference frames that the encoder may store, REF_FRAMES
is usually larger than INTER_REFS_PER_FRAME. For example, in the
ext-refs experiment, REF_FRAMES == 8, which allows the encoder to
store maximum 8 reference frames in the buffer, but
INTER_REFS_PER_FRAME equals to 6, which allows each Inter frame may
use up to 6 frames out of the 8 buffered frames as its references.
Hence, in order to explore the possibility to store more reference
frames in future patches, we modified a couple of array sizes to
accommodate the case that the number of buffered reference frames is
not always equal to the number of the references that are being used
by each Inter frame.
Change-Id: I19e42ef608946cc76ebfd3e965a05f4b9b93a0b3
2016-08-04 00:46:43 +03:00
|
|
|
// NOTE(zoeliu): Any inter frame allows maximum of REF_FRAMES inter
|
|
|
|
// references; Plus the currently coded frame itself, it is needed to allocate
|
|
|
|
// sufficient space to the size of the maximum possible number of frames.
|
|
|
|
int interp_filter_selected[REF_FRAMES + 1][SWITCHABLE];
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
struct aom_codec_pkt_list *output_pkt_list;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
MBGRAPH_FRAME_STATS mbgraph_stats[MAX_LAG_BUFFERS];
|
2016-08-12 06:13:14 +03:00
|
|
|
int mbgraph_n_frames; // number of frames filled in the above
|
|
|
|
int static_mb_pct; // % forced skip mbs by segmentation
|
2015-08-06 05:00:31 +03:00
|
|
|
int ref_frame_flags;
|
|
|
|
|
|
|
|
SPEED_FEATURES sf;
|
|
|
|
|
|
|
|
unsigned int max_mv_magnitude;
|
|
|
|
int mv_step_param;
|
|
|
|
|
|
|
|
int allow_comp_inter_inter;
|
|
|
|
|
Make superblock size variable at the frame level.
The uncompressed frame header contains a bit to signal whether the
frame is encoded using 64x64 or 128x128 superblocks. This can vary
between any 2 frames.
vpxenc gained the --sb-size={64,128,dynamic} option, which allows the
configuration of the superblock size used (default is dynamic). 64/128
will force the encoder to always use the specified superblock size.
Dynamic would enable the encoder to choose the sb size for each
frame, but this is not implemented yet (dynamic does the same as 128
for now).
Constraints on tile sizes depend on the superblock size, the following
is a summary of the current bitstream syntax and semantics:
If both --enable-ext-tile is OFF and --enable-ext-partition is OFF:
The tile coding in this case is the same as VP9. In particular,
tiles have a minimum width of 256 pixels and a maximum width of
4096 pixels. The tile width must be multiples of 64 pixels
(except for the rightmost tile column). There can be a maximum
of 64 tile columns and 4 tile rows.
If --enable-ext-tile is OFF and --enable-ext-partition is ON:
Same constraints as above, except that tile width must be
multiples of 128 pixels (except for the rightmost tile column).
There is no change in the bitstream syntax used for coding the tile
configuration if --enable-ext-tile is OFF.
If --enable-ext-tile is ON and --enable-ext-partition is OFF:
This is the new large scale tile coding configuration. The
minimum/maximum tile width and height are 64/4096 pixels. Tile
width and height must be multiples of 64 pixels. The uncompressed
header contains two 6 bit fields that hold the tile width/height
in units of 64 pixels. The maximum number of tile rows/columns
is only limited by the maximum frame size of 65536x65536 pixels
that can be coded in the bitstream. This yields a maximum of
1024x1024 tile rows and columns (of 64x64 tiles in a 65536x65536
frame).
If both --enable-ext-tile is ON and --enable-ext-partition is ON:
Same applies as above, except that in the bitstream the 2 fields
containing the tile width/height are in units of the superblock
size, and the superblock size itself is also coded in the bitstream.
If the uncompressed header signals the use of 64x64 superblocks,
then the tile width/height fields are 6 bits wide and are in units
of 64 pixels. If the uncompressed header signals the use of 128x128
superblocks, then the tile width/height fields are 5 bits wide and
are in units of 128 pixels.
The above is a summary of the bitstream. The user interface to vpxenc
(and the equivalent encoder API) behaves as follows:
If --enable-ext-tile is OFF:
No change in the user interface. --tile-columns and --tile-rows
specify the base 2 logarithm of the desired number of tile columns
and tile rows. The actual number of tile rows and tile columns,
and the particular tile width and tile height are computed by the
codec ensuring all of the above constraints are respected.
If --enable-ext-tile is ON, but --enable-ext-partition is OFF:
No change in the user interface. --tile-columns and --tile-rows
specify the WIDTH and HEIGHT of the tiles in unit of 64 pixels.
The valid values are in the range [1, 64] (which corresponds to
[64, 4096] pixels in increments of 64).
If both --enable-ext-tile is ON and --enable-ext-partition is ON:
If --sb-size=64 (default):
The user interface is the same as in the previous point.
--tile-columns and --tile-rows specify tile WIDTH and HEIGHT,
in units of 64 pixels, in the range [1, 64] (which corresponds
to [64, 4096] pixels in increments of 64).
If --sb-size=128 or --sb-size=dynamic:
--tile-columns and --tile-rows specify tile WIDTH and HEIGHT,
in units of 128 pixels in the range [1, 32] (which corresponds
to [128, 4096] pixels in increments of 128).
Change-Id: Idc9beee1ad12ff1634e83671985d14c680f9179a
2016-03-24 16:56:05 +03:00
|
|
|
uint8_t *segmentation_map;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
CYCLIC_REFRESH *cyclic_refresh;
|
|
|
|
ActiveMap active_map;
|
|
|
|
|
|
|
|
fractional_mv_step_fp *find_fractional_mv_step;
|
2016-08-31 00:01:10 +03:00
|
|
|
av1_full_search_fn_t full_search_sad; // It is currently unused.
|
|
|
|
av1_diamond_search_fn_t diamond_search_sad;
|
|
|
|
aom_variance_fn_ptr_t fn_ptr[BLOCK_SIZES];
|
2015-08-06 05:00:31 +03:00
|
|
|
uint64_t time_receive_data;
|
|
|
|
uint64_t time_compress_data;
|
|
|
|
uint64_t time_pick_lpf;
|
|
|
|
uint64_t time_encode_sb_row;
|
|
|
|
|
|
|
|
#if CONFIG_FP_MB_STATS
|
|
|
|
int use_fp_mb_stats;
|
|
|
|
#endif
|
|
|
|
|
|
|
|
TWO_PASS twopass;
|
|
|
|
|
|
|
|
YV12_BUFFER_CONFIG alt_ref_buffer;
|
|
|
|
|
|
|
|
#if CONFIG_INTERNAL_STATS
|
|
|
|
unsigned int mode_chosen_counts[MAX_MODES];
|
|
|
|
|
2016-08-12 06:13:14 +03:00
|
|
|
int count;
|
2015-08-06 05:00:31 +03:00
|
|
|
uint64_t total_sq_error;
|
|
|
|
uint64_t total_samples;
|
|
|
|
ImageStat psnr;
|
|
|
|
|
|
|
|
double total_blockiness;
|
|
|
|
double worst_blockiness;
|
|
|
|
|
2016-08-12 06:13:14 +03:00
|
|
|
int bytes;
|
2015-08-06 05:00:31 +03:00
|
|
|
double summed_quality;
|
|
|
|
double summed_weights;
|
|
|
|
unsigned int tot_recode_hits;
|
|
|
|
double worst_ssim;
|
|
|
|
|
|
|
|
ImageStat fastssim;
|
|
|
|
ImageStat psnrhvs;
|
|
|
|
|
|
|
|
int b_calculate_blockiness;
|
|
|
|
int b_calculate_consistency;
|
|
|
|
|
|
|
|
double total_inconsistency;
|
|
|
|
double worst_consistency;
|
|
|
|
Ssimv *ssim_vars;
|
|
|
|
Metrics metrics;
|
|
|
|
#endif
|
|
|
|
int b_calculate_psnr;
|
|
|
|
|
|
|
|
int droppable;
|
|
|
|
|
|
|
|
int initial_width;
|
|
|
|
int initial_height;
|
|
|
|
int initial_mbs; // Number of MBs in the full-size frame; to be used to
|
|
|
|
// normalize the firstpass stats. This will differ from the
|
|
|
|
// number of MBs in the current frame when the frame is
|
|
|
|
// scaled.
|
|
|
|
|
|
|
|
// Store frame variance info in SOURCE_VAR_BASED_PARTITION search type.
|
2016-10-15 02:51:44 +03:00
|
|
|
DIFF *source_diff_var;
|
2015-08-06 05:00:31 +03:00
|
|
|
// The threshold used in SOURCE_VAR_BASED_PARTITION search type.
|
|
|
|
unsigned int source_var_thresh;
|
|
|
|
int frames_till_next_var_check;
|
|
|
|
|
|
|
|
int frame_flags;
|
|
|
|
|
|
|
|
search_site_config ss_cfg;
|
|
|
|
|
2015-12-30 21:27:19 +03:00
|
|
|
int mbmode_cost[BLOCK_SIZE_GROUPS][INTRA_MODES];
|
2015-12-02 21:59:01 +03:00
|
|
|
#if CONFIG_REF_MV
|
|
|
|
int newmv_mode_cost[NEWMV_MODE_CONTEXTS][2];
|
|
|
|
int zeromv_mode_cost[ZEROMV_MODE_CONTEXTS][2];
|
|
|
|
int refmv_mode_cost[REFMV_MODE_CONTEXTS][2];
|
2016-01-22 05:07:31 +03:00
|
|
|
int drl_mode_cost0[DRL_MODE_CONTEXTS][2];
|
2016-01-08 02:13:52 +03:00
|
|
|
#if CONFIG_EXT_INTER
|
|
|
|
int new2mv_mode_cost[2];
|
|
|
|
#endif // CONFIG_EXT_INTER
|
2015-12-02 21:59:01 +03:00
|
|
|
#endif
|
|
|
|
|
2015-08-06 05:00:31 +03:00
|
|
|
unsigned int inter_mode_cost[INTER_MODE_CONTEXTS][INTER_MODES];
|
2016-01-20 03:45:45 +03:00
|
|
|
#if CONFIG_EXT_INTER
|
2016-09-08 08:40:40 +03:00
|
|
|
unsigned int inter_compound_mode_cost[INTER_MODE_CONTEXTS]
|
|
|
|
[INTER_COMPOUND_MODES];
|
2016-03-31 03:33:15 +03:00
|
|
|
unsigned int interintra_mode_cost[BLOCK_SIZE_GROUPS][INTERINTRA_MODES];
|
2016-01-20 03:45:45 +03:00
|
|
|
#endif // CONFIG_EXT_INTER
|
2016-10-14 01:18:22 +03:00
|
|
|
#if CONFIG_MOTION_VAR || CONFIG_WARPED_MOTION
|
|
|
|
int motion_mode_cost[BLOCK_SIZES][MOTION_MODES];
|
2016-09-09 00:48:15 +03:00
|
|
|
#if CONFIG_MOTION_VAR && CONFIG_WARPED_MOTION
|
|
|
|
int motion_mode_cost1[BLOCK_SIZES][2];
|
|
|
|
#endif // CONFIG_MOTION_VAR && CONFIG_WARPED_MOTION
|
2016-10-14 01:18:22 +03:00
|
|
|
#endif // CONFIG_MOTION_VAR || CONFIG_WARPED_MOTION
|
2015-11-07 00:56:51 +03:00
|
|
|
int intra_uv_mode_cost[INTRA_MODES][INTRA_MODES];
|
2015-08-06 05:00:31 +03:00
|
|
|
int y_mode_costs[INTRA_MODES][INTRA_MODES][INTRA_MODES];
|
|
|
|
int switchable_interp_costs[SWITCHABLE_FILTER_CONTEXTS][SWITCHABLE_FILTERS];
|
2016-03-17 19:50:28 +03:00
|
|
|
#if CONFIG_EXT_PARTITION_TYPES
|
|
|
|
int partition_cost[PARTITION_CONTEXTS][EXT_PARTITION_TYPES];
|
|
|
|
#else
|
2015-08-06 05:00:31 +03:00
|
|
|
int partition_cost[PARTITION_CONTEXTS][PARTITION_TYPES];
|
2016-03-17 19:50:28 +03:00
|
|
|
#endif
|
2016-10-13 02:28:56 +03:00
|
|
|
#if CONFIG_PALETTE
|
2015-12-08 05:18:57 +03:00
|
|
|
int palette_y_size_cost[PALETTE_BLOCK_SIZES][PALETTE_SIZES];
|
|
|
|
int palette_uv_size_cost[PALETTE_BLOCK_SIZES][PALETTE_SIZES];
|
2016-09-08 08:40:40 +03:00
|
|
|
int palette_y_color_cost[PALETTE_MAX_SIZE - 1][PALETTE_COLOR_CONTEXTS]
|
|
|
|
[PALETTE_COLORS];
|
|
|
|
int palette_uv_color_cost[PALETTE_MAX_SIZE - 1][PALETTE_COLOR_CONTEXTS]
|
|
|
|
[PALETTE_COLORS];
|
2016-10-13 02:28:56 +03:00
|
|
|
#endif // CONFIG_PALETTE
|
2016-03-08 02:25:50 +03:00
|
|
|
int tx_size_cost[TX_SIZES - 1][TX_SIZE_CONTEXTS][TX_SIZES];
|
2015-09-03 12:58:12 +03:00
|
|
|
#if CONFIG_EXT_TX
|
2015-10-12 22:30:55 +03:00
|
|
|
int inter_tx_type_costs[EXT_TX_SETS_INTER][EXT_TX_SIZES][TX_TYPES];
|
|
|
|
int intra_tx_type_costs[EXT_TX_SETS_INTRA][EXT_TX_SIZES][INTRA_MODES]
|
2016-08-12 06:13:14 +03:00
|
|
|
[TX_TYPES];
|
2016-01-11 21:27:35 +03:00
|
|
|
#else
|
2016-01-06 22:24:57 +03:00
|
|
|
int intra_tx_type_costs[EXT_TX_SIZES][TX_TYPES][TX_TYPES];
|
|
|
|
int inter_tx_type_costs[EXT_TX_SIZES][TX_TYPES];
|
2015-09-03 12:58:12 +03:00
|
|
|
#endif // CONFIG_EXT_TX
|
2016-01-13 03:38:58 +03:00
|
|
|
#if CONFIG_EXT_INTRA
|
2016-12-07 03:58:23 +03:00
|
|
|
#if CONFIG_INTRA_INTERP
|
2016-01-13 03:38:58 +03:00
|
|
|
int intra_filter_cost[INTRA_FILTERS + 1][INTRA_FILTERS];
|
2016-12-07 03:58:23 +03:00
|
|
|
#endif // CONFIG_INTRA_INTERP
|
2016-01-13 03:38:58 +03:00
|
|
|
#endif // CONFIG_EXT_INTRA
|
2016-09-09 01:15:17 +03:00
|
|
|
#if CONFIG_LOOP_RESTORATION
|
|
|
|
int switchable_restore_cost[RESTORE_SWITCHABLE_TYPES];
|
|
|
|
#endif // CONFIG_LOOP_RESTORATION
|
2016-12-08 00:20:44 +03:00
|
|
|
#if CONFIG_GLOBAL_MOTION
|
|
|
|
int gmtype_cost[TRANS_TYPES];
|
|
|
|
#endif // CONFIG_GLOBAL_MOTION
|
2016-01-13 03:38:58 +03:00
|
|
|
|
|
|
|
int multi_arf_allowed;
|
|
|
|
int multi_arf_enabled;
|
|
|
|
int multi_arf_last_grp_enabled;
|
2016-03-11 20:42:49 +03:00
|
|
|
|
|
|
|
TileDataEnc *tile_data;
|
|
|
|
int allocated_tiles; // Keep track of memory allocated for tiles.
|
|
|
|
|
|
|
|
TOKENEXTRA *tile_tok[MAX_TILE_ROWS][MAX_TILE_COLS];
|
|
|
|
unsigned int tok_count[MAX_TILE_ROWS][MAX_TILE_COLS];
|
|
|
|
|
|
|
|
TileBufferEnc tile_buffers[MAX_TILE_ROWS][MAX_TILE_COLS];
|
|
|
|
|
2015-08-06 05:00:31 +03:00
|
|
|
int resize_pending;
|
|
|
|
int resize_state;
|
|
|
|
int resize_scale_num;
|
|
|
|
int resize_scale_den;
|
|
|
|
int resize_avg_qp;
|
|
|
|
int resize_buffer_underflow;
|
|
|
|
int resize_count;
|
|
|
|
|
|
|
|
// VAR_BASED_PARTITION thresholds
|
2016-04-11 19:41:58 +03:00
|
|
|
// 0 - threshold_128x128;
|
|
|
|
// 1 - threshold_64x64;
|
|
|
|
// 2 - threshold_32x32;
|
|
|
|
// 3 - threshold_16x16;
|
|
|
|
// 4 - threshold_8x8;
|
|
|
|
int64_t vbp_thresholds[5];
|
2015-08-06 05:00:31 +03:00
|
|
|
int64_t vbp_threshold_minmax;
|
|
|
|
int64_t vbp_threshold_sad;
|
|
|
|
BLOCK_SIZE vbp_bsize_min;
|
|
|
|
|
2016-06-09 17:12:27 +03:00
|
|
|
// VARIANCE_AQ segment map refresh
|
|
|
|
int vaq_refresh;
|
|
|
|
|
2015-08-06 05:00:31 +03:00
|
|
|
// Multi-threading
|
|
|
|
int num_workers;
|
2016-08-31 00:01:10 +03:00
|
|
|
AVxWorker *workers;
|
2015-08-06 05:00:31 +03:00
|
|
|
struct EncWorkerData *tile_thr_data;
|
2016-08-31 00:01:10 +03:00
|
|
|
AV1LfSync lf_row_sync;
|
2016-01-08 01:29:26 +03:00
|
|
|
#if CONFIG_ENTROPY
|
|
|
|
SUBFRAME_STATS subframe_stats;
|
2016-05-11 00:42:27 +03:00
|
|
|
// TODO(yaowu): minimize the size of count buffers
|
|
|
|
SUBFRAME_STATS wholeframe_stats;
|
2016-08-31 00:01:10 +03:00
|
|
|
av1_coeff_stats branch_ct_buf[COEF_PROBS_BUFS][TX_SIZES][PLANE_TYPES];
|
2016-01-08 01:29:26 +03:00
|
|
|
#endif // CONFIG_ENTROPY
|
2016-04-14 00:53:34 +03:00
|
|
|
#if CONFIG_ANS
|
|
|
|
struct BufAnsCoder buf_ans;
|
|
|
|
#endif
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
2016-02-04 20:47:46 +03:00
|
|
|
int refresh_frame_mask;
|
|
|
|
int existing_fb_idx_to_show;
|
2016-07-27 00:41:15 +03:00
|
|
|
int is_arf_filter_off[MAX_EXT_ARFS + 1];
|
|
|
|
int num_extra_arfs;
|
|
|
|
int arf_map[MAX_EXT_ARFS + 1];
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2016-07-11 21:47:55 +03:00
|
|
|
#if CONFIG_GLOBAL_MOTION
|
2016-11-22 19:55:49 +03:00
|
|
|
// Stores number of prediction blocks using global motion and the
|
|
|
|
// number of 4x4 blocks using it per reference frame.
|
|
|
|
int global_motion_used[TOTAL_REFS_PER_FRAME][2];
|
2016-11-16 03:07:12 +03:00
|
|
|
int global_motion_search_done;
|
2016-07-11 21:47:55 +03:00
|
|
|
#endif
|
2016-11-09 15:32:54 +03:00
|
|
|
#if CONFIG_REFERENCE_BUFFER
|
|
|
|
SequenceHeader seq_params;
|
|
|
|
#endif
|
2016-08-31 00:01:10 +03:00
|
|
|
} AV1_COMP;
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
void av1_initialize_enc(void);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
struct AV1_COMP *av1_create_compressor(AV1EncoderConfig *oxcf,
|
|
|
|
BufferPool *const pool);
|
|
|
|
void av1_remove_compressor(AV1_COMP *cpi);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
void av1_change_config(AV1_COMP *cpi, const AV1EncoderConfig *oxcf);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-12 06:13:14 +03:00
|
|
|
// Receive a frame's worth of data. The caller can assume that a copy of this
|
|
|
|
// frame is made, and not just a copy of the pointer.
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_receive_raw_frame(AV1_COMP *cpi, unsigned int frame_flags,
|
|
|
|
YV12_BUFFER_CONFIG *sd, int64_t time_stamp,
|
|
|
|
int64_t end_time_stamp);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_get_compressed_data(AV1_COMP *cpi, unsigned int *frame_flags,
|
|
|
|
size_t *size, uint8_t *dest, int64_t *time_stamp,
|
|
|
|
int64_t *time_end, int flush);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_get_preview_raw_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *dest);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_get_last_show_frame(AV1_COMP *cpi, YV12_BUFFER_CONFIG *frame);
|
2016-05-20 02:46:10 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_use_as_reference(AV1_COMP *cpi, int ref_frame_flags);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
void av1_update_reference(AV1_COMP *cpi, int ref_frame_flags);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_copy_reference_enc(AV1_COMP *cpi, AOM_REFFRAME ref_frame_flag,
|
2016-08-12 06:13:14 +03:00
|
|
|
YV12_BUFFER_CONFIG *sd);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_set_reference_enc(AV1_COMP *cpi, AOM_REFFRAME ref_frame_flag,
|
|
|
|
YV12_BUFFER_CONFIG *sd);
|
|
|
|
|
|
|
|
int av1_update_entropy(AV1_COMP *cpi, int update);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_set_active_map(AV1_COMP *cpi, unsigned char *map, int rows, int cols);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_get_active_map(AV1_COMP *cpi, unsigned char *map, int rows, int cols);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_set_internal_size(AV1_COMP *cpi, AOM_SCALING horiz_mode,
|
|
|
|
AOM_SCALING vert_mode);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_set_size_literal(AV1_COMP *cpi, unsigned int width,
|
|
|
|
unsigned int height);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
int av1_get_quantizer(struct AV1_COMP *cpi);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
void av1_full_to_model_counts(av1_coeff_count_model *model_count,
|
|
|
|
av1_coeff_count *full_count);
|
2016-01-08 01:29:26 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
static INLINE int frame_is_kf_gf_arf(const AV1_COMP *cpi) {
|
2016-08-12 06:13:14 +03:00
|
|
|
return frame_is_intra_only(&cpi->common) || cpi->refresh_alt_ref_frame ||
|
2015-08-06 05:00:31 +03:00
|
|
|
(cpi->refresh_golden_frame && !cpi->rc.is_src_frame_alt_ref);
|
|
|
|
}
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
static INLINE int get_ref_frame_map_idx(const AV1_COMP *cpi,
|
2015-08-06 05:00:31 +03:00
|
|
|
MV_REFERENCE_FRAME ref_frame) {
|
2015-11-12 13:12:17 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
if (ref_frame >= LAST_FRAME && ref_frame <= LAST3_FRAME)
|
2015-12-03 03:27:46 +03:00
|
|
|
return cpi->lst_fb_idxes[ref_frame - 1];
|
|
|
|
#else
|
2016-08-12 06:13:14 +03:00
|
|
|
if (ref_frame == LAST_FRAME) return cpi->lst_fb_idx;
|
2015-11-12 13:12:17 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2015-12-03 03:27:46 +03:00
|
|
|
else if (ref_frame == GOLDEN_FRAME)
|
2015-08-06 05:00:31 +03:00
|
|
|
return cpi->gld_fb_idx;
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If BFG_INTERVAL in vp10/encoder/firstpass.h is changed from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
2016-02-04 20:47:46 +03:00
|
|
|
else if (ref_frame == BWDREF_FRAME)
|
|
|
|
return cpi->bwd_fb_idx;
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If BFG_INTERVAL in vp10/encoder/firstpass.h is changed from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2015-12-03 03:27:46 +03:00
|
|
|
else
|
2015-08-06 05:00:31 +03:00
|
|
|
return cpi->alt_fb_idx;
|
|
|
|
}
|
|
|
|
|
2016-10-14 03:27:51 +03:00
|
|
|
static INLINE int get_ref_frame_buf_idx(const AV1_COMP *cpi,
|
2016-05-19 01:47:04 +03:00
|
|
|
MV_REFERENCE_FRAME ref_frame) {
|
2016-08-31 00:01:10 +03:00
|
|
|
const AV1_COMMON *const cm = &cpi->common;
|
2015-08-06 05:00:31 +03:00
|
|
|
const int map_idx = get_ref_frame_map_idx(cpi, ref_frame);
|
|
|
|
return (map_idx != INVALID_IDX) ? cm->ref_frame_map[map_idx] : INVALID_IDX;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Returns the frame buffer in the common buffer pool that backs `ref_frame`,
// or NULL when get_ref_frame_buf_idx() reports INVALID_IDX for it.
static INLINE YV12_BUFFER_CONFIG *get_ref_frame_buffer(
    const AV1_COMP *cpi, MV_REFERENCE_FRAME ref_frame) {
  const int pool_idx = get_ref_frame_buf_idx(cpi, ref_frame);
  if (pool_idx == INVALID_IDX) return NULL;
  return &cpi->common.buffer_pool->frame_bufs[pool_idx].buf;
}
|
|
|
|
|
2016-05-19 01:47:04 +03:00
|
|
|
static INLINE const YV12_BUFFER_CONFIG *get_upsampled_ref(
|
2016-10-14 03:27:51 +03:00
|
|
|
const AV1_COMP *cpi, const MV_REFERENCE_FRAME ref_frame) {
|
2016-05-19 01:47:04 +03:00
|
|
|
// Use up-sampled reference frames.
|
|
|
|
const int buf_idx =
|
|
|
|
cpi->upsampled_ref_idx[get_ref_frame_map_idx(cpi, ref_frame)];
|
|
|
|
return &cpi->upsampled_ref_bufs[buf_idx].buf;
|
|
|
|
}
|
|
|
|
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If BFG_INTERVAL in vp10/encoder/firstpass.h is changed from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#if CONFIG_EXT_REFS
|
2016-08-31 00:01:10 +03:00
|
|
|
// Returns 1 when `frame_buf` is the pool entry currently backing any
// reference from LAST_FRAME through ALTREF_FRAME, and 0 otherwise.
// References whose buffer index is INVALID_IDX are ignored.
static INLINE int enc_is_ref_frame_buf(AV1_COMP *cpi, RefCntBuffer *frame_buf) {
  AV1_COMMON *const cm = &cpi->common;
  MV_REFERENCE_FRAME ref;

  for (ref = LAST_FRAME; ref <= ALTREF_FRAME; ++ref) {
    const int pool_idx = get_ref_frame_buf_idx(cpi, ref);
    if (pool_idx != INVALID_IDX &&
        frame_buf == &cm->buffer_pool->frame_bufs[pool_idx]) {
      return 1;
    }
  }
  return 0;
}
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If BFG_INTERVAL in vp10/encoder/firstpass.h is changed from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2016-05-25 21:57:15 +03:00
|
|
|
|
2016-03-11 20:42:49 +03:00
|
|
|
// Returns the number of tokens to allocate for an area of
// mb_rows x mb_cols macroblocks.
//
// We assume 3 planes all at full resolution. We assume up to 1 token per
// pixel (16 * 16 per macroblock), and then allow a head room of 1 EOSB token
// per 4x4 block per plane (16), plus EOSB_TOKEN per plane (1).
//
// The product is evaluated in unsigned arithmetic: the previous all-`int`
// expression could overflow (undefined behaviour) for very large dimensions
// before being converted to the unsigned return type. Results are unchanged
// for every input that did not overflow.
static INLINE unsigned int get_token_alloc(int mb_rows, int mb_cols) {
  const unsigned int tokens_per_mb_per_plane = 16 * 16 + 17;
  const unsigned int num_planes = 3;
  return (unsigned int)mb_rows * (unsigned int)mb_cols *
         tokens_per_mb_per_plane * num_planes;
}
|
|
|
|
|
|
|
|
// Get the allocated token size for a tile. It does the same calculation as in
|
|
|
|
// the frame token allocation.
|
2016-03-11 20:42:49 +03:00
|
|
|
static INLINE unsigned int allocated_tokens(TileInfo tile) {
|
2015-08-06 05:00:31 +03:00
|
|
|
int tile_mb_rows = (tile.mi_row_end - tile.mi_row_start + 1) >> 1;
|
|
|
|
int tile_mb_cols = (tile.mi_col_end - tile.mi_col_start + 1) >> 1;
|
|
|
|
|
|
|
|
return get_token_alloc(tile_mb_rows, tile_mb_cols);
|
|
|
|
}
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably allocates the encoder instance's working data --
// confirm against the definition.
void av1_alloc_compressor_data(AV1_COMP *cpi);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably rescales the encoder's reference frames where
// their size differs from the current frame -- confirm against the definition.
void av1_scale_references(AV1_COMP *cpi);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably refreshes the reference buffer assignments after a
// frame has been coded -- confirm against the definition.
void av1_update_reference_frames(AV1_COMP *cpi);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably switches high-precision motion vectors on or off
// for `cpi` according to `allow_high_precision_mv` -- confirm.
void av1_set_high_precision_mv(AV1_COMP *cpi, int allow_high_precision_mv);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably returns `scaled` (filled by a fast resampler) when
// `unscaled` does not match the coded size, and `unscaled` otherwise --
// confirm against the definition.
YV12_BUFFER_CONFIG *av1_scale_if_required_fast(
    AV1_COMMON *cm, YV12_BUFFER_CONFIG *unscaled, YV12_BUFFER_CONFIG *scaled);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably returns `scaled` when `unscaled` had to be
// resampled to the coded size, and `unscaled` otherwise -- confirm against
// the definition.
YV12_BUFFER_CONFIG *av1_scale_if_required(
    AV1_COMMON *cm, YV12_BUFFER_CONFIG *unscaled, YV12_BUFFER_CONFIG *scaled);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably applies the per-frame encode `flags` passed by the
// API caller to the encoder state -- confirm against the definition.
void av1_apply_encoding_flags(AV1_COMP *cpi, aom_enc_frame_flags_t flags);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
static INLINE int is_altref_enabled(const AV1_COMP *const cpi) {
|
2015-08-06 05:00:31 +03:00
|
|
|
return cpi->oxcf.mode != REALTIME && cpi->oxcf.lag_in_frames > 0 &&
|
2015-08-28 01:11:38 +03:00
|
|
|
cpi->oxcf.enable_auto_arf;
|
2015-08-06 05:00:31 +03:00
|
|
|
}
|
|
|
|
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If BFG_INTERVAL in vp10/encoder/firstpass.h is changed from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
// TODO(zoeliu): To set up cpi->oxcf.enable_auto_brf
|
|
|
|
#if 0 && CONFIG_EXT_REFS
|
2016-08-31 00:01:10 +03:00
|
|
|
static INLINE int is_bwdref_enabled(const AV1_COMP *const cpi) {
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If in vp10/encoder/firstpass.h, change BFG_INTERVAL from 2 to 3, i.e. to
use 2 bi-predictive frames than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
// NOTE(zoeliu): The enabling of bi-predictive frames depends on the use of
|
|
|
|
// alt_ref, and now will be off when the alt_ref interval is
|
|
|
|
// not sufficiently large.
|
|
|
|
return is_altref_enabled(cpi) && cpi->oxcf.enable_auto_brf;
|
2016-02-04 20:47:46 +03:00
|
|
|
}
|
Merge bi-predictive frames to EXT_REFS
This patch removed the experiment of BIDIR_PRED and merged the feature
into the experiment of EXT_REFS:
(1) Each frame now has up to 6 reference frames, namely
LAST_FRAME, LAST2_FRAME, LAST3_FRAME, GOLDEN_FRAME, (forward) and
BWDREF_FRAME, ALTREF_FRAME (backward);
LAST4_FRAME has been removed;
(2) First pass still keeps the 8 updates:
KF_UPDATE, LF_UPDATE, GF_UPDATE, ARF_UPDATE, OVERLAY_UPDATE, and
BRF_UPDATE, LAST_BIPRED_UPDATE, BI_PRED_UPDATE;
(3) show_existing_frame==1 is supported in the experiment of EXT_REFS;
(4) New encoding modes are added for both single-ref and compound cases,
through the use of the 2 extra forward references (LAST2 & LAST3)
and the 1 extra backward reference (BWDREF).
RD performance wise, using Overall PSNR: Avg/BDRate
Bipred only Prev EXT_REFS Current EXT_REFS with bipred
lowres: -3.474/-3.324 -1.748/-1.586 -4.613/-4.387
derflr: -2.097/-1.353 -1.439/-1.215 -3.120/-2.252
midres: -2.129/-1.901 -1.345/-1.185 -2.898/-2.636
If BFG_INTERVAL in vp10/encoder/firstpass.h is changed from 2 to 3, i.e. to
use 2 bi-predictive frames rather than 1, a further improvement may be
obtained:
Current EXT_REFS with bipred
1 bi-predictive frame 2 bi-predictive frames
lowres: -4.613/-4.387 -4.675/-4.465
derflr: -3.120/-2.252 -3.333/-2.516
midres: -2.898/-2.636 -3.406/-3.095
Change-Id: Ib06fe9ea0a5cfd7418a1d79b978ee9d80bf191cb
2016-06-09 00:27:56 +03:00
|
|
|
#endif // CONFIG_EXT_REFS
|
2016-02-04 20:47:46 +03:00
|
|
|
|
2016-10-14 03:27:51 +03:00
|
|
|
static INLINE void set_ref_ptrs(const AV1_COMMON *cm, MACROBLOCKD *xd,
|
2015-08-06 05:00:31 +03:00
|
|
|
MV_REFERENCE_FRAME ref0,
|
|
|
|
MV_REFERENCE_FRAME ref1) {
|
2016-08-12 06:13:14 +03:00
|
|
|
xd->block_refs[0] =
|
|
|
|
&cm->frame_refs[ref0 >= LAST_FRAME ? ref0 - LAST_FRAME : 0];
|
|
|
|
xd->block_refs[1] =
|
|
|
|
&cm->frame_refs[ref1 >= LAST_FRAME ? ref1 - LAST_FRAME : 0];
|
2015-08-06 05:00:31 +03:00
|
|
|
}
|
|
|
|
|
|
|
|
// Returns the lowest bit of `frame_index` (0 or 1), so the result alternates
// between consecutive frame indices.
static INLINE int get_chessboard_index(const int frame_index) {
  const int low_bit = frame_index & 1;
  return low_bit;
}
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
static INLINE int *cond_cost_list(const struct AV1_COMP *cpi, int *cost_list) {
|
2015-08-06 05:00:31 +03:00
|
|
|
return cpi->sf.mv.subpel_search_method != SUBPEL_TREE ? cost_list : NULL;
|
|
|
|
}
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
// Declaration only; the definition is outside this header.
// NOTE(review): presumably updates the encoder's frame-rate dependent state
// for the new `framerate` -- confirm against the definition.
void av1_new_framerate(AV1_COMP *cpi, double framerate);
|
2015-08-06 05:00:31 +03:00
|
|
|
|
|
|
|
// Flat index for the pair (sl, tl): sl * num_tl + tl, i.e. num_tl consecutive
// slots for each value of sl. Every argument is evaluated exactly once.
// NOTE(review): sl/tl are presumably spatial/temporal layer ids -- confirm.
#define LAYER_IDS_TO_IDX(sl, tl, num_tl) ((sl) * (num_tl) + (tl))
|
|
|
|
|
2016-02-17 01:33:18 +03:00
|
|
|
// Update up-sampled reference frame index.
|
|
|
|
static INLINE void uref_cnt_fb(EncRefCntBuffer *ubufs, int *uidx,
|
|
|
|
int new_uidx) {
|
|
|
|
const int ref_index = *uidx;
|
|
|
|
|
|
|
|
if (ref_index >= 0 && ubufs[ref_index].ref_count > 0)
|
|
|
|
ubufs[ref_index].ref_count--;
|
|
|
|
|
|
|
|
*uidx = new_uidx;
|
|
|
|
ubufs[new_uidx].ref_count++;
|
|
|
|
}
|
|
|
|
|
2016-03-02 00:16:03 +03:00
|
|
|
#ifdef __cplusplus
|
|
|
|
} // extern "C"
|
|
|
|
#endif
|
|
|
|
|
2016-08-31 00:01:10 +03:00
|
|
|
#endif // AV1_ENCODER_ENCODER_H_
|