summaryrefslogtreecommitdiff
diff options
context:
space:
mode:
-rw-r--r-- vp9/encoder/vp9_encodeframe.c 99
-rw-r--r-- vp9/encoder/vp9_encodeframe.h 3
-rw-r--r-- vp9/encoder/vp9_encoder.c 15
-rw-r--r-- vp9/encoder/vp9_encoder.h 14
4 files changed, 130 insertions, 1 deletions
diff --git a/vp9/encoder/vp9_encodeframe.c b/vp9/encoder/vp9_encodeframe.c
index 8449474d4..22b5f06ac 100644
--- a/vp9/encoder/vp9_encodeframe.c
+++ b/vp9/encoder/vp9_encodeframe.c
@@ -3583,6 +3583,8 @@ static int wiener_var_rdmult(VP9_COMP *cpi, BLOCK_SIZE bsize, int mi_row,
int row, col;
int64_t rdmult;
int64_t wiener_variance = 0;
+ KMEANS_DATA *kmeans_data;
+ vpx_clear_system_state();
assert(cpi->norm_wiener_variance > 0);
@@ -3590,10 +3592,12 @@ static int wiener_var_rdmult(VP9_COMP *cpi, BLOCK_SIZE bsize, int mi_row,
for (col = mb_col_start; col < mb_col_end; ++col)
wiener_variance += cpi->mb_wiener_variance[row * cm->mb_cols + col];
+ kmeans_data = &cpi->kmeans_data_arr[cpi->kmeans_data_size++];
+ kmeans_data->value = log(1 + wiener_variance);
+ kmeans_data->pos = mi_row * cpi->kmeans_data_stride + mi_col;
if (wiener_variance)
wiener_variance /=
(mb_row_end - mb_row_start) * (mb_col_end - mb_col_start);
-
rdmult = (orig_rdmult * wiener_variance) / cpi->norm_wiener_variance;
rdmult = VPXMIN(rdmult, orig_rdmult * 3);
@@ -5673,6 +5677,89 @@ static int input_fpmb_stats(FIRSTPASS_MB_STATS *firstpass_mb_stats,
}
#endif
+// qsort() comparator: orders KMEANS_DATA entries by ascending `value`.
+// Returns 1 when *a is larger, -1 when *a is smaller, and 0 otherwise.
+static int compare_kmeans_data(const void *a, const void *b) {
+  const double lhs = ((const KMEANS_DATA *)a)->value;
+  const double rhs = ((const KMEANS_DATA *)b)->value;
+  // Each comparison evaluates to 0 or 1, so the difference is the three-way
+  // result; operands that are neither greater nor smaller compare as equal.
+  return (lhs > rhs) - (lhs < rhs);
+}
+
+// Fills boundary_ls[0 .. k - 1] with the group thresholds implied by the
+// centers in ctr_ls: entry j (j < k - 1) is the midpoint between centers j and
+// j + 1, and the last entry is a sentinel (max + 1) that no sample reaches, so
+// the last group is never left.
+static void kmeans_compute_boundaries(const double *ctr_ls, int k, double max,
+                                      double *boundary_ls) {
+  int j;
+  for (j = 0; j < k - 1; ++j) {
+    boundary_ls[j] = (ctr_ls[j] + ctr_ls[j + 1]) / 2.;
+  }
+  boundary_ls[k - 1] = max + 1;
+}
+
+// Returns the group that `value` falls into, starting the search at group_idx.
+// Samples are visited in ascending order, so the index only ever moves
+// forward; it is clamped to the last group (k - 1).
+static int kmeans_advance_group(const double *boundary_ls, int k,
+                                int group_idx, double value) {
+  while (value >= boundary_ls[group_idx]) {
+    ++group_idx;
+    if (group_idx == k - 1) {
+      break;
+    }
+  }
+  return group_idx;
+}
+
+// One-dimensional k-means over arr[0 .. size - 1].
+//
+// ctr_ls: output, receives the k group centers in ascending order.
+// k:      number of groups, 2 <= k <= MAX_KMEANS_GROUPS (asserted).
+// arr:    samples; sorted in place by ascending `value`, and on return each
+//         entry's `group_idx` holds the group it was assigned to.
+// size:   number of entries in arr.
+//
+// If arr is NULL or size <= 0 there is nothing to cluster: the function
+// returns without touching ctr_ls or arr.
+void vp9_kmeans(double *ctr_ls, int k, KMEANS_DATA *arr, int size) {
+  double min, max;
+  double step;
+  int i, j;
+  int itr;
+  double boundary_ls[MAX_KMEANS_GROUPS] = { 0 };
+  int group_idx;
+  double sum;
+  int count;
+
+  vpx_clear_system_state();
+
+  assert(k >= 2 && k <= MAX_KMEANS_GROUPS);
+
+  // Guard against an empty sample set: arr[0] and arr[size - 1] below would
+  // otherwise be read out of bounds.
+  if (arr == NULL || size <= 0) {
+    return;
+  }
+
+  qsort(arr, size, sizeof(*arr), compare_kmeans_data);
+
+  min = arr[0].value;
+  max = arr[size - 1].value;
+
+  // initialize the center points: k centers evenly spread over [min, max],
+  // each placed in the middle of its slice
+  step = (max - min) * 1. / k;
+  for (j = 0; j < k; ++j) {
+    ctr_ls[j] = min + j * step + step / 2;
+  }
+
+  // Fixed number of refinement passes.
+  for (itr = 0; itr < 10; ++itr) {
+    // Boundaries are frozen for the whole pass, so updating ctr_ls while
+    // walking the samples does not affect the assignment.
+    kmeans_compute_boundaries(ctr_ls, k, max, boundary_ls);
+
+    group_idx = 0;
+    count = 0;
+    sum = 0;
+    for (i = 0; i < size; ++i) {
+      group_idx = kmeans_advance_group(boundary_ls, k, group_idx, arr[i].value);
+
+      sum += arr[i].value;
+      ++count;
+
+      // Last sample of the current group (end of data, or the next sample
+      // crosses the boundary): replace the center with the group mean.
+      // Groups that received no sample keep their previous center.
+      if (i + 1 == size || arr[i + 1].value >= boundary_ls[group_idx]) {
+        ctr_ls[group_idx] = sum / count;
+        count = 0;
+        sum = 0;
+      }
+    }
+  }
+
+  // compute group_idx for every sample from the final centers
+  kmeans_compute_boundaries(ctr_ls, k, max, boundary_ls);
+  group_idx = 0;
+  for (i = 0; i < size; ++i) {
+    group_idx = kmeans_advance_group(boundary_ls, k, group_idx, arr[i].value);
+    arr[i].group_idx = group_idx;
+  }
+}
+
static void encode_frame_internal(VP9_COMP *cpi) {
SPEED_FEATURES *const sf = &cpi->sf;
ThreadData *const td = &cpi->td;
@@ -5782,6 +5869,11 @@ static void encode_frame_internal(VP9_COMP *cpi) {
}
#endif
+ if (cpi->sf.enable_wiener_variance && cm->show_frame) {
+ cpi->kmeans_data_size = 0;
+ cpi->kmeans_ctr_num = 5;
+ }
+
if (!cpi->row_mt) {
cpi->row_mt_sync_read_ptr = vp9_row_mt_sync_read_dummy;
cpi->row_mt_sync_write_ptr = vp9_row_mt_sync_write_dummy;
@@ -5797,6 +5889,11 @@ static void encode_frame_internal(VP9_COMP *cpi) {
vp9_encode_tiles_row_mt(cpi);
}
+ if (cpi->sf.enable_wiener_variance && cm->show_frame) {
+ vp9_kmeans(cpi->kmeans_ctr_ls, cpi->kmeans_ctr_num, cpi->kmeans_data_arr,
+ cpi->kmeans_data_size);
+ }
+
vpx_usec_timer_mark(&emr_timer);
cpi->time_encode_sb_row += vpx_usec_timer_elapsed(&emr_timer);
}
diff --git a/vp9/encoder/vp9_encodeframe.h b/vp9/encoder/vp9_encodeframe.h
index 1798c0048..a761ae68b 100644
--- a/vp9/encoder/vp9_encodeframe.h
+++ b/vp9/encoder/vp9_encodeframe.h
@@ -45,6 +45,9 @@ void vp9_encode_sb_row(struct VP9_COMP *cpi, struct ThreadData *td,
void vp9_set_variance_partition_thresholds(struct VP9_COMP *cpi, int q,
int content_state);
+struct KMEANS_DATA;  // forward declaration; the struct is defined in vp9_encoder.h
+void vp9_kmeans(double *ctr_ls, int k, struct KMEANS_DATA *arr, int size);  // sorts arr by value, splits it into k groups, writes the k centers to ctr_ls
+
#ifdef __cplusplus
} // extern "C"
#endif
diff --git a/vp9/encoder/vp9_encoder.c b/vp9/encoder/vp9_encoder.c
index 3c9ae1bb1..edad53d31 100644
--- a/vp9/encoder/vp9_encoder.c
+++ b/vp9/encoder/vp9_encoder.c
@@ -2388,6 +2388,7 @@ VP9_COMP *vp9_create_compressor(VP9EncoderConfig *oxcf,
sizeof(*cpi->mb_wiener_variance)));
}
+ cpi->kmeans_data_arr_alloc = 0;
#if CONFIG_NON_GREEDY_MV
cpi->feature_score_loc_alloc = 0;
cpi->tpl_ready = 0;
@@ -2591,6 +2592,10 @@ void vp9_remove_compressor(VP9_COMP *cpi) {
vp9_denoiser_free(&(cpi->denoiser));
#endif
+ if (cpi->kmeans_data_arr_alloc) {
+ vpx_free(cpi->kmeans_data_arr);
+ }
+
#if CONFIG_NON_GREEDY_MV
vpx_free(cpi->feature_score_loc_arr);
vpx_free(cpi->feature_score_loc_sort);
@@ -7250,6 +7255,16 @@ int vp9_get_compressed_data(VP9_COMP *cpi, unsigned int *frame_flags,
for (i = 0; i < REFS_PER_FRAME; ++i) cpi->scaled_ref_idx[i] = INVALID_IDX;
}
+ if (cpi->kmeans_data_arr_alloc == 0) {
+ const int mi_cols = mi_cols_aligned_to_sb(cm->mi_cols);
+ const int mi_rows = mi_cols_aligned_to_sb(cm->mi_rows);
+ CHECK_MEM_ERROR(
+ cm, cpi->kmeans_data_arr,
+ vpx_calloc(mi_rows * mi_cols, sizeof(*cpi->kmeans_data_arr)));
+ cpi->kmeans_data_stride = mi_cols;
+ cpi->kmeans_data_arr_alloc = 1;
+ }
+
if (gf_group_index == 1 &&
cpi->twopass.gf_group.update_type[gf_group_index] == ARF_UPDATE &&
cpi->sf.enable_tpl_model) {
diff --git a/vp9/encoder/vp9_encoder.h b/vp9/encoder/vp9_encoder.h
index e578646b9..278408fd5 100644
--- a/vp9/encoder/vp9_encoder.h
+++ b/vp9/encoder/vp9_encoder.h
@@ -567,6 +567,14 @@ typedef struct FEATURE_SCORE_LOC {
} FEATURE_SCORE_LOC;
#endif
+#define MAX_KMEANS_GROUPS 8
+
+typedef struct KMEANS_DATA {  // one sample clustered by vp9_kmeans()
+ double value;  // clustered quantity; wiener_var_rdmult() stores log(1 + wiener_variance)
+ int pos;  // block position; wiener_var_rdmult() stores mi_row * kmeans_data_stride + mi_col
+ int group_idx;  // group index assigned by vp9_kmeans(), in [0, k - 1]
+} KMEANS_DATA;
+
typedef struct VP9_COMP {
QUANTS quants;
ThreadData td;
@@ -594,6 +602,12 @@ typedef struct VP9_COMP {
TplDepFrame tpl_stats[MAX_ARF_GOP_SIZE];
YV12_BUFFER_CONFIG *tpl_recon_frames[REF_FRAMES];
EncFrameBuf enc_frame_buf[REF_FRAMES];
+ int kmeans_data_arr_alloc;
+ KMEANS_DATA *kmeans_data_arr;
+ int kmeans_data_size;
+ int kmeans_data_stride;
+ double kmeans_ctr_ls[MAX_KMEANS_GROUPS];
+ int kmeans_ctr_num;
#if CONFIG_NON_GREEDY_MV
int tpl_ready;
int feature_score_loc_alloc;