Allow asymmetric frame buffers for temporal filtering.

This patch changes how frame buffers are chosen for temporal filtering.

First, it allows temporal filtering to use different numbers of preceding and succeeding frames. This makes it possible to use more frames when the sequence is stable, to better remove noise.

Second, before this patch, the noise level was used to determine how many additional frames to use for temporal filtering. The argument was that when noise is high, MVs tend to become unreliable, and hence we should not use as many frames. However, this contradicts the intuition that when noise is high, we also need more frames to de-noise.

This patch instead uses the frame-level correlation derived from first-pass stats to determine the number of frames used (i.e. how asymmetric the frames can be, relative to the to-be-filtered frame). The derived correlation is the correlation of the underlying random process without additional noise, and therefore should measure the stability of MVs better.

Coding gains were observed:

Speed1:
          avgPSNR  ovrPSNR  SSIM    vmaf
lowres    -0.091   -0.198   -0.118  -0.686
midres    -0.167   -0.251   -0.269  -0.361
ugc360p   -0.169   -0.260   -0.358  -0.108

Speed4:
          avgPSNR  ovrPSNR  SSIM    vmaf
lowres    -0.198   -0.323   -0.184  -0.655
midres    -0.095   -0.178   -0.101  -0.143
ugc360p   -0.223   -0.293   -0.440  -0.122

STATS_CHANGED

Change-Id: I53edd0efacba949563dbce17c732c9d99e633cfe

commit: 34f4b38092630652a7a2ea716098042e059ddb79 [log] [tgz]
author: Bohan Li <bohanli@google.com> Tue Nov 10 10:20:08 2020 -0800
committer: Bohan Li <bohanli@google.com> Wed Nov 11 00:54:50 2020 +0000
tree: eccb5da32b4686fcc3aafa43d3ff10901a83760d
parent: 70f041ae050a635c01a88f6cab41bf0862ddeeb5 [diff]
diff --git a/av1/encoder/temporal_filter.c b/av1/encoder/temporal_filter.c
index 04e2d83..595630f 100644
--- a/av1/encoder/temporal_filter.c
+++ b/av1/encoder/temporal_filter.c

@@ -1071,24 +1071,36 @@
   }
   // Get quantization factor.
   const int q = get_q(cpi);
+  // Get correlation estimates from first-pass
+  RATE_CONTROL *rc = &cpi->rc;
+  const double *coeff = rc->cor_coeff;
+  const int offset = rc->regions_offset;
+  int cur_frame_idx = filter_frame_offset + rc->frames_since_key - offset;
+  if (rc->frames_since_key == 0) cur_frame_idx++;
 
-  // Adjust number of filtering frames based on noise and quantization factor.
-  // Basically, we would like to use more frames to filter low-noise frame such
-  // that the filtered frame can provide better predictions for more frames.
-  // Also, when the quantization factor is small enough (lossless compression),
-  // we will not change the number of frames for key frame filtering, which is
-  // to avoid visual quality drop.
-  int adjust_num = 0;
+  double accu_coeff0 = 1.0, accu_coeff1 = 1.0;
+  for (int i = 1; i <= max_after; i++) {
+    accu_coeff1 *= coeff[cur_frame_idx + i];
+  }
+  if (max_after >= 1) {
+    accu_coeff1 = pow(accu_coeff1, 1.0 / (double)max_after);
+  }
+  for (int i = 1; i <= max_before; i++) {
+    accu_coeff0 *= coeff[cur_frame_idx - i + 1];
+  }
+  if (max_before >= 1) {
+    accu_coeff0 = pow(accu_coeff0, 1.0 / (double)max_before);
+  }
+
+  // Adjust number of filtering frames based on quantization factor. When the
+  // quantization factor is small enough (lossless compression), we will not
+  // change the number of frames for key frame filtering, which is to avoid
+  // visual quality drop.
+  int adjust_num = 6;
   if (num_frames == 1) {  // `arnr_max_frames = 1` is used to disable filtering.
     adjust_num = 0;
   } else if (filter_frame_lookahead_idx < 0 && q <= 10) {
     adjust_num = 0;
-  } else if (noise_levels[0] < 0.5) {
-    adjust_num = 6;
-  } else if (noise_levels[0] < 1.0) {
-    adjust_num = 4;
-  } else if (noise_levels[0] < 2.0) {
-    adjust_num = 2;
   }
   num_frames = AOMMIN(num_frames + adjust_num, lookahead_depth + 1);
 
@@ -1104,8 +1116,29 @@
     num_frames += !(num_frames & 1);  // Make the number odd.
     // Only use 2 neighbours for the second ARF.
     if (is_second_arf) num_frames = AOMMIN(num_frames, 3);
-    num_before = AOMMIN(num_frames >> 1, max_before);
-    num_after = AOMMIN(num_frames >> 1, max_after);
+    if (AOMMIN(max_after, max_before) >= num_frames / 2) {
+      // just use half half
+      num_before = num_frames / 2;
+      num_after = num_frames / 2;
+    } else {
+      if (max_after < num_frames / 2) {
+        num_after = max_after;
+        num_before = AOMMIN(num_frames - 1 - num_after, max_before);
+      } else {
+        num_before = max_before;
+        num_after = AOMMIN(num_frames - 1 - num_before, max_after);
+      }
+      // Adjust insymmetry based on frame-level correlation
+      if (max_after > 0 && max_before > 0) {
+        if (num_after < num_before) {
+          const int insym = (int)(0.4 / AOMMAX(1 - accu_coeff1, 0.01));
+          num_before = AOMMIN(num_before, num_after + insym);
+        } else {
+          const int insym = (int)(0.4 / AOMMAX(1 - accu_coeff0, 0.01));
+          num_after = AOMMIN(num_after, num_before + insym);
+        }
+      }
+    }
   }
   num_frames = num_before + 1 + num_after;
commit	34f4b38092630652a7a2ea716098042e059ddb79	[log] [tgz]
author	Bohan Li <bohanli@google.com>	Tue Nov 10 10:20:08 2020 -0800
committer	Bohan Li <bohanli@google.com>	Wed Nov 11 00:54:50 2020 +0000
tree	eccb5da32b4686fcc3aafa43d3ff10901a83760d
parent	70f041ae050a635c01a88f6cab41bf0862ddeeb5 [diff]