[CFL] Compute Average Over TX Block Instead of Pred Block

When computing alpha, multiple averages are computed, one for each
transform block. The CfL prediction now uses the transform block average
instead of the partition block average.

This allows the decoder to build the CfL prediction by using only the
collocated reconstructed luma values for the current transform size and
not the entire partition.

Results on Subset 1 (Compared to 0e81b97c with CfL)

  PSNR | PSNR Cb | PSNR Cr | PSNR HVS |   SSIM | MS SSIM | CIEDE 2000
0.0180 |  0.2627 |  0.2274 |   0.0233 | 0.0301 |  0.0312 |     0.1506

A small regression is expected; this change was made to simplify hardware
implementations.

Change-Id: Ib2ce2a3053b85300c5c62ef0e3270af489568a38

commit: 03678940ccd19ed6f9f3d9658785b7d9f08b39d8 [log] [tgz]
author: Luc Trudeau <luc@trud.ca> Mon Jun 12 17:33:19 2017 -0400
committer: Luc Trudeau <luc@trud.ca> Thu Jul 06 09:37:38 2017 -0400
tree: 2c2c6f32b148bcbedf52e6926d17f835b106a543
parent: 5c453db29e1a6645d3bef4e8de0b4ae23e0db4f8 [diff] [blame]
diff --git a/av1/common/cfl.c b/av1/common/cfl.c
index 1ffea03..154df73 100644
--- a/av1/common/cfl.c
+++ b/av1/common/cfl.c

@@ -183,24 +183,41 @@
   cfl->dc_pred[CFL_PRED_V] = sum_v / num_pel;
 }
 
-static void cfl_compute_average(CFL_CTX *cfl) {
+static void cfl_compute_averages(CFL_CTX *cfl, TX_SIZE tx_size) {
   const int width = cfl->uv_width;
   const int height = cfl->uv_height;
-  const double num_pel = width * height;
+  const int tx_height = tx_size_high[tx_size];
+  const int tx_width = tx_size_wide[tx_size];
+  const int stride = width >> tx_size_wide_log2[tx_size];
+  const int block_row_stride = MAX_SB_SIZE << tx_size_high_log2[tx_size];
+  const double num_pel = tx_width * tx_height;
   // TODO(ltrudeau) Convert to uint16 for HBD support
   const uint8_t *y_pix = cfl->y_down_pix;
   // TODO(ltrudeau) Convert to uint16 for HBD support
+  const uint8_t *t_y_pix;
+  double *averages = cfl->y_averages;
 
   cfl_load(cfl, 0, 0, width, height);
 
-  int sum = 0;
-  for (int j = 0; j < height; j++) {
-    for (int i = 0; i < width; i++) {
-      sum += y_pix[i];
+  int a = 0;
+  for (int b_j = 0; b_j < height; b_j += tx_height) {
+    for (int b_i = 0; b_i < width; b_i += tx_width) {
+      int sum = 0;
+      t_y_pix = y_pix;
+      for (int t_j = 0; t_j < tx_height; t_j++) {
+        for (int t_i = b_i; t_i < b_i + tx_width; t_i++) {
+          sum += t_y_pix[t_i];
+        }
+        t_y_pix += MAX_SB_SIZE;
+      }
+      averages[a++] = sum / num_pel;
     }
-    y_pix += MAX_SB_SIZE;
+    assert(a % stride == 0);
+    y_pix += block_row_stride;
   }
-  cfl->y_average = sum / num_pel;
+
+  cfl->y_averages_stride = stride;
+  assert(a <= MAX_NUM_TXB);
 }
 
 static INLINE double cfl_idx_to_alpha(int alpha_idx, CFL_SIGN_TYPE alpha_sign,
@@ -234,7 +251,12 @@
   const double alpha = cfl_idx_to_alpha(
       mbmi->cfl_alpha_idx, mbmi->cfl_alpha_signs[plane - 1], plane - 1);
 
-  const double avg = cfl->y_average;
+  const int avg_row =
+      (row << tx_size_wide_log2[0]) >> tx_size_wide_log2[tx_size];
+  const int avg_col =
+      (col << tx_size_high_log2[0]) >> tx_size_high_log2[tx_size];
+  const double avg =
+      cfl->y_averages[cfl->y_averages_stride * avg_row + avg_col];
 
   cfl_load(cfl, row, col, width, height);
   for (int j = 0; j < height; j++) {
@@ -348,7 +370,7 @@
   // Compute block-level DC_PRED for both chromatic planes.
   // DC_PRED replaces beta in the linear model.
   cfl_dc_pred(xd, plane_bsize);
-  // Compute block-level average on reconstructed luma input.
-  cfl_compute_average(cfl);
+  // Compute transform-level average on reconstructed luma input.
+  cfl_compute_averages(cfl, tx_size);
   cfl->are_parameters_computed = 1;
 }
commit	03678940ccd19ed6f9f3d9658785b7d9f08b39d8	[log] [tgz]
author	Luc Trudeau <luc@trud.ca>	Mon Jun 12 17:33:19 2017 -0400
committer	Luc Trudeau <luc@trud.ca>	Thu Jul 06 09:37:38 2017 -0400
tree	2c2c6f32b148bcbedf52e6926d17f835b106a543
parent	5c453db29e1a6645d3bef4e8de0b4ae23e0db4f8 [diff] [blame]