diff options
author | Paul Wilkins <paulwilkins@google.com> | 2021-03-22 19:45:10 +0000 |
---|---|---|
committer | Paul Wilkins <paulwilkins@google.com> | 2021-03-23 15:05:32 +0000 |
commit | e37ee40f7ee0dbafa41e7d1c32dc34740727c7a1 (patch) | |
tree | 140156a811218a55e074d91031e3d92dcd04eb0c /vp9/encoder/vp9_rd.c | |
parent | 90c1cc651592f2dbad517ceb65dc0c0fef3d0dbc (diff) | |
download | libvpx-e37ee40f7ee0dbafa41e7d1c32dc34740727c7a1.tar libvpx-e37ee40f7ee0dbafa41e7d1c32dc34740727c7a1.tar.gz libvpx-e37ee40f7ee0dbafa41e7d1c32dc34740727c7a1.tar.bz2 libvpx-e37ee40f7ee0dbafa41e7d1c32dc34740727c7a1.zip |
Convert Vizier RD parameters to normalized factors
This patch converts the Vizier custom RD multipliers, to factors
that adjust each RD multiplier either side of its default value, where
a factor of 1.0 will give the previous default behavior.
Ultimately I would like to replace the multiple RD multipliers
triggered at different Q thresholds (eg, low, medium, high q)
with a function that adjusts the rd behavior smoothly as Q
changes.
Vizier could then be presented with a single adjustment control
for each of key frame and inter frame rd.
The current behavior is problematic.
Firstly having hard threshold Q values at which rd behavior changes
may cause anomalies in the rate distortion curve, where in some
situations, raising Q, for example, may not cause the expected drop
in rate and rise in distortion, because we have crossed a threshold
where the rate distortion multiplier changes sharply and this alters
the balance of bits spent in the prediction and residual parts of the
signal.
Having a single value that is used for a range of Q index values
(eg 0-64), (65-128) may also cause problems and over-fitting in
the context of the Vizier ML project. This project tries to optimize
the values for each Q range, for various YT formats, but does so
by analyzing the results of single point encodes on a set of clips.
For a given format all the clips are encoded with the same parameters
(target rate etc) so there is likely to be clustering in regards to the
Q values used. For example the training set may give a new value
for the Q range 0-64 but most of the data points used may have Q
close 64.
It will likely require several iterations working with the Vizier team
to get this right. This patch just gives an initial framework for
testing.
Change-Id: Iaa4cd5561b95a202bcae7a1d876c4f40ef444fa2
Diffstat (limited to 'vp9/encoder/vp9_rd.c')
-rw-r--r-- | vp9/encoder/vp9_rd.c | 117 |
1 files changed, 66 insertions, 51 deletions
diff --git a/vp9/encoder/vp9_rd.c b/vp9/encoder/vp9_rd.c index d5d668f96..d3bf3d6d4 100644 --- a/vp9/encoder/vp9_rd.c +++ b/vp9/encoder/vp9_rd.c @@ -205,65 +205,74 @@ void vp9_init_rd_parameters(VP9_COMP *cpi) { // Make sure this function is floating point safe. vpx_clear_system_state(); - rdc->rd_mult_q_sq_key_high_qp = 7.5; // No defined Vizer values yet + rdc->rd_mult_key_high_qp_fac = 1.0; // Default: no Vizer values yet if (0) { unsigned int screen_area = (cpi->common.width * cpi->common.height); if (screen_area <= 176 * 144) { - rdc->rd_mult_q_sq_inter_low_qp = 4.0718581295922025; - rdc->rd_mult_q_sq_inter_mid_qp = 4.031435609256739; - rdc->rd_mult_q_sq_inter_high_qp = 4.295745965132044; - rdc->rd_mult_q_sq_key_ultralow_qp = 4.290774097327333; - rdc->rd_mult_q_sq_key_low_qp = 5.7037775720838155; - rdc->rd_mult_q_sq_key_mid_qp = 4.72424015517201; + rdc->rd_mult_inter_low_qp_fac = 1.018; + rdc->rd_mult_inter_mid_qp_fac = 0.896; + rdc->rd_mult_inter_high_qp_fac = 1.432; + rdc->rd_mult_key_ultralow_qp_fac = 1.073; + rdc->rd_mult_key_low_qp_fac = 1.630; + rdc->rd_mult_key_mid_qp_fac = 1.050; } else if (screen_area <= 320 * 240) { - rdc->rd_mult_q_sq_inter_low_qp = 4.506676356706102; - rdc->rd_mult_q_sq_inter_mid_qp = 4.489349899621181; - rdc->rd_mult_q_sq_inter_high_qp = 4.388244213131458; - rdc->rd_mult_q_sq_key_ultralow_qp = 4.217074424696166; - rdc->rd_mult_q_sq_key_low_qp = 4.497000582319771; - rdc->rd_mult_q_sq_key_mid_qp = 4.2825894884789735; + rdc->rd_mult_inter_low_qp_fac = 1.127; + rdc->rd_mult_inter_mid_qp_fac = 0.998; + rdc->rd_mult_inter_high_qp_fac = 1.463; + rdc->rd_mult_key_ultralow_qp_fac = 1.054; + rdc->rd_mult_key_low_qp_fac = 1.285; + rdc->rd_mult_key_mid_qp_fac = 0.952; } else if (screen_area <= 640 * 360) { - rdc->rd_mult_q_sq_inter_low_qp = 4.730644123689013; - rdc->rd_mult_q_sq_inter_mid_qp = 4.314589509578551; - rdc->rd_mult_q_sq_inter_high_qp = 4.3702861603380025; - rdc->rd_mult_q_sq_key_ultralow_qp = 4.576902541873747; - rdc->rd_mult_q_sq_key_low_qp = 6.068652999601526; - rdc->rd_mult_q_sq_key_mid_qp = 4.817707474077241; + rdc->rd_mult_inter_low_qp_fac = 1.183; + rdc->rd_mult_inter_mid_qp_fac = 0.959; + rdc->rd_mult_inter_high_qp_fac = 1.457; + rdc->rd_mult_key_ultralow_qp_fac = 1.144; + rdc->rd_mult_key_low_qp_fac = 1.734; + rdc->rd_mult_key_mid_qp_fac = 1.071; } else if (screen_area <= 854 * 480) { - rdc->rd_mult_q_sq_inter_low_qp = 4.811470143416073; - rdc->rd_mult_q_sq_inter_mid_qp = 4.621618127750201; - rdc->rd_mult_q_sq_inter_high_qp = 3.969083125219539; - rdc->rd_mult_q_sq_key_ultralow_qp = 4.9854544277222566; - rdc->rd_mult_q_sq_key_low_qp = 5.073157238799473; - rdc->rd_mult_q_sq_key_mid_qp = 5.7587672849242635; + rdc->rd_mult_inter_low_qp_fac = 1.203; + rdc->rd_mult_inter_mid_qp_fac = 1.027; + rdc->rd_mult_inter_high_qp_fac = 1.027; + rdc->rd_mult_key_ultralow_qp_fac = 1.246; + rdc->rd_mult_key_low_qp_fac = 1.246; + rdc->rd_mult_key_mid_qp_fac = 1.280; } else if (screen_area <= 1280 * 720) { - rdc->rd_mult_q_sq_inter_low_qp = 5.119381136011107; - rdc->rd_mult_q_sq_inter_mid_qp = 4.518613675766538; - rdc->rd_mult_q_sq_inter_high_qp = 4.410712348825541; - rdc->rd_mult_q_sq_key_ultralow_qp = 3.9468491666607326; - rdc->rd_mult_q_sq_key_low_qp = 5.848703119971484; - rdc->rd_mult_q_sq_key_mid_qp = 5.368947246228739; + rdc->rd_mult_inter_low_qp_fac = 1.280; + rdc->rd_mult_inter_mid_qp_fac = 1.004; + rdc->rd_mult_inter_high_qp_fac = 1.470; + rdc->rd_mult_key_ultralow_qp_fac = 0.987; + rdc->rd_mult_key_low_qp_fac = 1.671; + rdc->rd_mult_key_mid_qp_fac = 1.193; } else { - rdc->rd_mult_q_sq_inter_low_qp = 6.00569815296199; - rdc->rd_mult_q_sq_inter_mid_qp = 3.932565684947023; - rdc->rd_mult_q_sq_inter_high_qp = 3.2141187537667797; - rdc->rd_mult_q_sq_key_ultralow_qp = 4.399795006320089; - rdc->rd_mult_q_sq_key_low_qp = 10.582906599488298; - rdc->rd_mult_q_sq_key_mid_qp = 6.274162346360692; + rdc->rd_mult_inter_low_qp_fac = 1.50; + rdc->rd_mult_inter_mid_qp_fac = 0.874; + rdc->rd_mult_inter_high_qp_fac = 1.07; + rdc->rd_mult_key_ultralow_qp_fac = 1.1; + rdc->rd_mult_key_low_qp_fac = 2.35; + rdc->rd_mult_key_mid_qp_fac = 0.837; } } else { // For now force defaults unless testing - rdc->rd_mult_q_sq_inter_low_qp = 4.0; - rdc->rd_mult_q_sq_inter_mid_qp = 4.5; - rdc->rd_mult_q_sq_inter_high_qp = 3.0; - rdc->rd_mult_q_sq_key_ultralow_qp = 4.0; - rdc->rd_mult_q_sq_key_low_qp = 3.5; - rdc->rd_mult_q_sq_key_mid_qp = 4.5; + rdc->rd_mult_inter_low_qp_fac = 1.0; + rdc->rd_mult_inter_mid_qp_fac = 1.0; + rdc->rd_mult_inter_high_qp_fac = 1.0; + rdc->rd_mult_key_ultralow_qp_fac = 1.0; + rdc->rd_mult_key_low_qp_fac = 1.0; + rdc->rd_mult_key_mid_qp_fac = 1.0; } } +// Default Rd multiplier values for Q ranges +#define INTER_LOW_QP_RDM 4.0 +#define INTER_MID_QP_RDM 4.5 +#define INTER_HIGH_QP_RDM 3.0 +#define KEY_ULOW_QP_RDM 4.0 +#define KEY_LOW_QP_RDM 3.5 +#define KEY_MID_QP_RDM 4.5 +#define KEY_HIGH_QP_RDM 7.5 + int vp9_compute_rd_mult_based_on_qindex(const VP9_COMP *cpi, int qindex) { const RD_CONTROL *rdc = &cpi->rd_ctrl; const int q = vp9_dc_quant(qindex, 0, cpi->common.bit_depth); @@ -275,22 +284,28 @@ int vp9_compute_rd_mult_based_on_qindex(const VP9_COMP *cpi, int qindex) { if (cpi->common.frame_type != KEY_FRAME) { if (qindex < 128) { - rdmult = (int)((double)rdmult * rdc->rd_mult_q_sq_inter_low_qp); + rdmult = (int)((double)rdmult * INTER_LOW_QP_RDM * + rdc->rd_mult_inter_low_qp_fac); } else if (qindex < 190) { - rdmult = (int)((double)rdmult * rdc->rd_mult_q_sq_inter_mid_qp); + rdmult = (int)((double)rdmult * INTER_MID_QP_RDM * + rdc->rd_mult_inter_mid_qp_fac); } else { - rdmult = (int)((double)rdmult * rdc->rd_mult_q_sq_inter_high_qp); + rdmult = (int)((double)rdmult * INTER_HIGH_QP_RDM * + rdc->rd_mult_inter_high_qp_fac); } } else { if (qindex < 64) { - rdmult = (int)((double)rdmult * rdc->rd_mult_q_sq_key_ultralow_qp); + rdmult = (int)((double)rdmult * KEY_ULOW_QP_RDM * + rdc->rd_mult_key_ultralow_qp_fac); } else if (qindex <= 128) { - rdmult = (int)((double)rdmult * rdc->rd_mult_q_sq_key_low_qp); + rdmult = + (int)((double)rdmult * KEY_LOW_QP_RDM * rdc->rd_mult_key_low_qp_fac); } else if (qindex < 190) { - rdmult = (int)((double)rdmult * rdc->rd_mult_q_sq_key_mid_qp); - + rdmult = + (int)((double)rdmult * KEY_MID_QP_RDM * rdc->rd_mult_key_mid_qp_fac); } else { - rdmult = (int)((double)rdmult * rdc->rd_mult_q_sq_key_high_qp); + rdmult = (int)((double)rdmult * KEY_HIGH_QP_RDM * + rdc->rd_mult_key_high_qp_fac); } } |