av1/encoder/picklpf.c - aom - Git at Google

 /*
  * Copyright (c) 2016, Alliance for Open Media. All rights reserved
  *
  * This source code is subject to the terms of the BSD 2 Clause License and
  * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
  * was not distributed with this source code in the LICENSE file, you can
  * obtain it at www.aomedia.org/license/software. If the Alliance for Open
  * Media Patent License 1.0 was not distributed with this source code in the
  * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
  */

 #include <assert.h>
 #include <limits.h>

 #include "config/aom_scale_rtcd.h"

 #include "aom_dsp/aom_dsp_common.h"
 #include "aom_dsp/psnr.h"
 #include "aom_mem/aom_mem.h"
 #include "aom_ports/mem.h"

 #include "av1/common/av1_loopfilter.h"
 #include "av1/common/onyxc_int.h"
 #include "av1/common/quant_common.h"

 #include "av1/encoder/av1_quantize.h"
 #include "av1/encoder/encoder.h"
 #include "av1/encoder/picklpf.h"

 static void yv12_copy_plane(const YV12_BUFFER_CONFIG *src_bc,
                             YV12_BUFFER_CONFIG *dst_bc, int plane) {
   switch (plane) {
     case 0: aom_yv12_copy_y(src_bc, dst_bc); break;
     case 1: aom_yv12_copy_u(src_bc, dst_bc); break;
     case 2: aom_yv12_copy_v(src_bc, dst_bc); break;
     default: assert(plane >= 0 && plane <= 2); break;
   }
 }

 int av1_get_max_filter_level(const AV1_COMP *cpi) {
   if (cpi->oxcf.pass == 2) {
     return cpi->twopass.section_intra_rating > 8 ? MAX_LOOP_FILTER * 3 / 4
                                                  : MAX_LOOP_FILTER;
   } else {
     return MAX_LOOP_FILTER;
   }
 }

 static int64_t try_filter_frame(const YV12_BUFFER_CONFIG *sd,
                                 AV1_COMP *const cpi, int filt_level,
                                 int partial_frame, int plane, int dir) {
   AV1_COMMON *const cm = &cpi->common;
   int64_t filt_err;

   assert(plane >= 0 && plane <= 2);
   int filter_level[2] = { filt_level, filt_level };
   if (plane == 0 && dir == 0) filter_level[1] = cm->lf.filter_level[1];
   if (plane == 0 && dir == 1) filter_level[0] = cm->lf.filter_level[0];

   // set base filters for use of av1_get_filter_level when in DELTA_LF mode
   switch (plane) {
     case 0:
       cm->lf.filter_level[0] = filter_level[0];
       cm->lf.filter_level[1] = filter_level[1];
       break;
     case 1: cm->lf.filter_level_u = filter_level[0]; break;
     case 2: cm->lf.filter_level_v = filter_level[0]; break;
   }

   // TODO(any): please enable multi-thread and remove the flag when loop
   // filter mask is compatible with multi-thread.
   if (cpi->num_workers > 1)
     av1_loop_filter_frame_mt(&cm->cur_frame->buf, cm, &cpi->td.mb.e_mbd, plane,
                              plane + 1, partial_frame,
 #if CONFIG_LPF_MASK
                              0,
 #endif
                              cpi->workers, cpi->num_workers, &cpi->lf_row_sync);
   else
     av1_loop_filter_frame(&cm->cur_frame->buf, cm, &cpi->td.mb.e_mbd,
 #if CONFIG_LPF_MASK
                           0,
 #endif
                           plane, plane + 1, partial_frame);

   filt_err = aom_get_sse_plane(sd, &cm->cur_frame->buf, plane,
                                cm->seq_params.use_highbitdepth);

   // Re-instate the unfiltered frame
   yv12_copy_plane(&cpi->last_frame_uf, &cm->cur_frame->buf, plane);

   return filt_err;
 }

 static int search_filter_level(const YV12_BUFFER_CONFIG *sd, AV1_COMP *cpi,
                                int partial_frame,
                                const int *last_frame_filter_level,
                                double *best_cost_ret, int plane, int dir) {
   const AV1_COMMON *const cm = &cpi->common;
   const int min_filter_level = 0;
   const int max_filter_level = av1_get_max_filter_level(cpi);
   int filt_direction = 0;
   int64_t best_err;
   int filt_best;
   MACROBLOCK *x = &cpi->td.mb;

   // Start the search at the previous frame filter level unless it is now out of
   // range.
   int lvl;
   switch (plane) {
     case 0:
       switch (dir) {
         case 2:
           lvl = (last_frame_filter_level[0] + last_frame_filter_level[1] + 1) >>
                 1;
           break;
         case 0:
         case 1: lvl = last_frame_filter_level[dir]; break;
         default: assert(dir >= 0 && dir <= 2); return 0;
       }
       break;
     case 1: lvl = last_frame_filter_level[2]; break;
     case 2: lvl = last_frame_filter_level[3]; break;
     default: assert(plane >= 0 && plane <= 2); return 0;
   }
   int filt_mid = clamp(lvl, min_filter_level, max_filter_level);
   int filter_step = filt_mid < 16 ? 4 : filt_mid / 4;
   // Sum squared error at each filter level
   int64_t ss_err[MAX_LOOP_FILTER + 1];

   // Set each entry to -1
   memset(ss_err, 0xFF, sizeof(ss_err));
   yv12_copy_plane(&cm->cur_frame->buf, &cpi->last_frame_uf, plane);
   best_err = try_filter_frame(sd, cpi, filt_mid, partial_frame, plane, dir);
   filt_best = filt_mid;
   ss_err[filt_mid] = best_err;

   while (filter_step > 0) {
     const int filt_high = AOMMIN(filt_mid + filter_step, max_filter_level);
     const int filt_low = AOMMAX(filt_mid - filter_step, min_filter_level);

     // Bias against raising loop filter in favor of lowering it.
     int64_t bias = (best_err >> (15 - (filt_mid / 8))) * filter_step;

     if ((cpi->oxcf.pass == 2) && (cpi->twopass.section_intra_rating < 20))
       bias = (bias * cpi->twopass.section_intra_rating) / 20;

     // yx, bias less for large block size
     if (cm->tx_mode != ONLY_4X4) bias >>= 1;

     if (filt_direction <= 0 && filt_low != filt_mid) {
       // Get Low filter error score
       if (ss_err[filt_low] < 0) {
         ss_err[filt_low] =
             try_filter_frame(sd, cpi, filt_low, partial_frame, plane, dir);
       }
       // If value is close to the best so far then bias towards a lower loop
       // filter value.
       if (ss_err[filt_low] < (best_err + bias)) {
         // Was it actually better than the previous best?
         if (ss_err[filt_low] < best_err) {
           best_err = ss_err[filt_low];
         }
         filt_best = filt_low;
       }
     }

     // Now look at filt_high
     if (filt_direction >= 0 && filt_high != filt_mid) {
       if (ss_err[filt_high] < 0) {
         ss_err[filt_high] =
             try_filter_frame(sd, cpi, filt_high, partial_frame, plane, dir);
       }
       // If value is significantly better than previous best, bias added against
       // raising filter value
       if (ss_err[filt_high] < (best_err - bias)) {
         best_err = ss_err[filt_high];
         filt_best = filt_high;
       }
     }

     // Half the step distance if the best filter value was the same as last time
     if (filt_best == filt_mid) {
       filter_step /= 2;
       filt_direction = 0;
     } else {
       filt_direction = (filt_best < filt_mid) ? -1 : 1;
       filt_mid = filt_best;
     }
   }

   // Update best error
   best_err = ss_err[filt_best];

   if (best_cost_ret) *best_cost_ret = RDCOST_DBL(x->rdmult, 0, best_err);
   return filt_best;
 }

 void av1_pick_filter_level(const YV12_BUFFER_CONFIG *sd, AV1_COMP *cpi,
                            LPF_PICK_METHOD method) {
   AV1_COMMON *const cm = &cpi->common;
   const int num_planes = av1_num_planes(cm);
   struct loopfilter *const lf = &cm->lf;
   (void)sd;

   lf->sharpness_level = 0;
   cpi->td.mb.rdmult = cpi->rd.RDMULT;

   if (method == LPF_PICK_MINIMAL_LPF) {
     lf->filter_level[0] = 0;
     lf->filter_level[1] = 0;
   } else if (method >= LPF_PICK_FROM_Q) {
     const int min_filter_level = 0;
     const int max_filter_level = av1_get_max_filter_level(cpi);
     const int q = av1_ac_quant_Q3(cm->base_qindex, 0, cm->seq_params.bit_depth);
     // based on tests result for rtc test set
     // 0.04590 boosted or 0.02295 non-booseted in 18-bit fixed point
     const int strength_boost_q_treshold = 700;
     const int inter_frame_multiplier =
         q > strength_boost_q_treshold ? 12034 : 6017;
     // These values were determined by linear fitting the result of the
     // searched level for 8 bit depth:
     // Keyframes: filt_guess = q * 0.06699 - 1.60817
     // Other frames: filt_guess = q * inter_frame_multiplier + 2.48225
     //
     // And high bit depth separately:
     // filt_guess = q * 0.316206 + 3.87252
     int filt_guess;
     switch (cm->seq_params.bit_depth) {
       case AOM_BITS_8:
         filt_guess =
             (cm->current_frame.frame_type == KEY_FRAME)
                 ? ROUND_POWER_OF_TWO(q * 17563 - 421574, 18)
                 : ROUND_POWER_OF_TWO(q * inter_frame_multiplier + 650707, 18);
         break;
       case AOM_BITS_10:
         filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 4060632, 20);
         break;
       case AOM_BITS_12:
         filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 16242526, 22);
         break;
       default:
         assert(0 &&
                "bit_depth should be AOM_BITS_8, AOM_BITS_10 "
                "or AOM_BITS_12");
         return;
     }
     if (cm->seq_params.bit_depth != AOM_BITS_8 &&
         cm->current_frame.frame_type == KEY_FRAME)
       filt_guess -= 4;
     // TODO(chengchen): retrain the model for Y, U, V filter levels
     lf->filter_level[0] = clamp(filt_guess, min_filter_level, max_filter_level);
     lf->filter_level[1] = clamp(filt_guess, min_filter_level, max_filter_level);
     lf->filter_level_u = clamp(filt_guess, min_filter_level, max_filter_level);
     lf->filter_level_v = clamp(filt_guess, min_filter_level, max_filter_level);
   } else {
     const int last_frame_filter_level[4] = { lf->filter_level[0],
                                              lf->filter_level[1],
                                              lf->filter_level_u,
                                              lf->filter_level_v };

     lf->filter_level[0] = lf->filter_level[1] =
         search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                             last_frame_filter_level, NULL, 0, 2);
     lf->filter_level[0] =
         search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                             last_frame_filter_level, NULL, 0, 0);
     lf->filter_level[1] =
         search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                             last_frame_filter_level, NULL, 0, 1);

     if (num_planes > 1) {
       lf->filter_level_u =
           search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                               last_frame_filter_level, NULL, 1, 0);
       lf->filter_level_v =
           search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
                               last_frame_filter_level, NULL, 2, 0);
     }
   }
 }
	/*
	* Copyright (c) 2016, Alliance for Open Media. All rights reserved
	*
	* This source code is subject to the terms of the BSD 2 Clause License and
	* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
	* was not distributed with this source code in the LICENSE file, you can
	* obtain it at www.aomedia.org/license/software. If the Alliance for Open
	* Media Patent License 1.0 was not distributed with this source code in the
	* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
	*/

	#include <assert.h>
	#include <limits.h>

	#include "config/aom_scale_rtcd.h"

	#include "aom_dsp/aom_dsp_common.h"
	#include "aom_dsp/psnr.h"
	#include "aom_mem/aom_mem.h"
	#include "aom_ports/mem.h"

	#include "av1/common/av1_loopfilter.h"
	#include "av1/common/onyxc_int.h"
	#include "av1/common/quant_common.h"

	#include "av1/encoder/av1_quantize.h"
	#include "av1/encoder/encoder.h"
	#include "av1/encoder/picklpf.h"

	static void yv12_copy_plane(const YV12_BUFFER_CONFIG *src_bc,
	YV12_BUFFER_CONFIG *dst_bc, int plane) {
	switch (plane) {
	case 0: aom_yv12_copy_y(src_bc, dst_bc); break;
	case 1: aom_yv12_copy_u(src_bc, dst_bc); break;
	case 2: aom_yv12_copy_v(src_bc, dst_bc); break;
	default: assert(plane >= 0 && plane <= 2); break;
	}
	}

	int av1_get_max_filter_level(const AV1_COMP *cpi) {
	if (cpi->oxcf.pass == 2) {
	return cpi->twopass.section_intra_rating > 8 ? MAX_LOOP_FILTER * 3 / 4
	: MAX_LOOP_FILTER;
	} else {
	return MAX_LOOP_FILTER;
	}
	}

	static int64_t try_filter_frame(const YV12_BUFFER_CONFIG *sd,
	AV1_COMP *const cpi, int filt_level,
	int partial_frame, int plane, int dir) {
	AV1_COMMON *const cm = &cpi->common;
	int64_t filt_err;

	assert(plane >= 0 && plane <= 2);
	int filter_level[2] = { filt_level, filt_level };
	if (plane == 0 && dir == 0) filter_level[1] = cm->lf.filter_level[1];
	if (plane == 0 && dir == 1) filter_level[0] = cm->lf.filter_level[0];

	// set base filters for use of av1_get_filter_level when in DELTA_LF mode
	switch (plane) {
	case 0:
	cm->lf.filter_level[0] = filter_level[0];
	cm->lf.filter_level[1] = filter_level[1];
	break;
	case 1: cm->lf.filter_level_u = filter_level[0]; break;
	case 2: cm->lf.filter_level_v = filter_level[0]; break;
	}

	// TODO(any): please enable multi-thread and remove the flag when loop
	// filter mask is compatible with multi-thread.
	if (cpi->num_workers > 1)
	av1_loop_filter_frame_mt(&cm->cur_frame->buf, cm, &cpi->td.mb.e_mbd, plane,
	plane + 1, partial_frame,
	#if CONFIG_LPF_MASK
	0,
	#endif
	cpi->workers, cpi->num_workers, &cpi->lf_row_sync);
	else
	av1_loop_filter_frame(&cm->cur_frame->buf, cm, &cpi->td.mb.e_mbd,
	#if CONFIG_LPF_MASK
	0,
	#endif
	plane, plane + 1, partial_frame);

	filt_err = aom_get_sse_plane(sd, &cm->cur_frame->buf, plane,
	cm->seq_params.use_highbitdepth);

	// Re-instate the unfiltered frame
	yv12_copy_plane(&cpi->last_frame_uf, &cm->cur_frame->buf, plane);

	return filt_err;
	}

	static int search_filter_level(const YV12_BUFFER_CONFIG sd, AV1_COMP cpi,
	int partial_frame,
	const int *last_frame_filter_level,
	double *best_cost_ret, int plane, int dir) {
	const AV1_COMMON *const cm = &cpi->common;
	const int min_filter_level = 0;
	const int max_filter_level = av1_get_max_filter_level(cpi);
	int filt_direction = 0;
	int64_t best_err;
	int filt_best;
	MACROBLOCK *x = &cpi->td.mb;

	// Start the search at the previous frame filter level unless it is now out of
	// range.
	int lvl;
	switch (plane) {
	case 0:
	switch (dir) {
	case 2:
	lvl = (last_frame_filter_level[0] + last_frame_filter_level[1] + 1) >>
	1;
	break;
	case 0:
	case 1: lvl = last_frame_filter_level[dir]; break;
	default: assert(dir >= 0 && dir <= 2); return 0;
	}
	break;
	case 1: lvl = last_frame_filter_level[2]; break;
	case 2: lvl = last_frame_filter_level[3]; break;
	default: assert(plane >= 0 && plane <= 2); return 0;
	}
	int filt_mid = clamp(lvl, min_filter_level, max_filter_level);
	int filter_step = filt_mid < 16 ? 4 : filt_mid / 4;
	// Sum squared error at each filter level
	int64_t ss_err[MAX_LOOP_FILTER + 1];

	// Set each entry to -1
	memset(ss_err, 0xFF, sizeof(ss_err));
	yv12_copy_plane(&cm->cur_frame->buf, &cpi->last_frame_uf, plane);
	best_err = try_filter_frame(sd, cpi, filt_mid, partial_frame, plane, dir);
	filt_best = filt_mid;
	ss_err[filt_mid] = best_err;

	while (filter_step > 0) {
	const int filt_high = AOMMIN(filt_mid + filter_step, max_filter_level);
	const int filt_low = AOMMAX(filt_mid - filter_step, min_filter_level);

	// Bias against raising loop filter in favor of lowering it.
	int64_t bias = (best_err >> (15 - (filt_mid / 8))) * filter_step;

	if ((cpi->oxcf.pass == 2) && (cpi->twopass.section_intra_rating < 20))
	bias = (bias * cpi->twopass.section_intra_rating) / 20;

	// yx, bias less for large block size
	if (cm->tx_mode != ONLY_4X4) bias >>= 1;

	if (filt_direction <= 0 && filt_low != filt_mid) {
	// Get Low filter error score
	if (ss_err[filt_low] < 0) {
	ss_err[filt_low] =
	try_filter_frame(sd, cpi, filt_low, partial_frame, plane, dir);
	}
	// If value is close to the best so far then bias towards a lower loop
	// filter value.
	if (ss_err[filt_low] < (best_err + bias)) {
	// Was it actually better than the previous best?
	if (ss_err[filt_low] < best_err) {
	best_err = ss_err[filt_low];
	}
	filt_best = filt_low;
	}
	}

	// Now look at filt_high
	if (filt_direction >= 0 && filt_high != filt_mid) {
	if (ss_err[filt_high] < 0) {
	ss_err[filt_high] =
	try_filter_frame(sd, cpi, filt_high, partial_frame, plane, dir);
	}
	// If value is significantly better than previous best, bias added against
	// raising filter value
	if (ss_err[filt_high] < (best_err - bias)) {
	best_err = ss_err[filt_high];
	filt_best = filt_high;
	}
	}

	// Half the step distance if the best filter value was the same as last time
	if (filt_best == filt_mid) {
	filter_step /= 2;
	filt_direction = 0;
	} else {
	filt_direction = (filt_best < filt_mid) ? -1 : 1;
	filt_mid = filt_best;
	}
	}

	// Update best error
	best_err = ss_err[filt_best];

	if (best_cost_ret) *best_cost_ret = RDCOST_DBL(x->rdmult, 0, best_err);
	return filt_best;
	}

	void av1_pick_filter_level(const YV12_BUFFER_CONFIG sd, AV1_COMP cpi,
	LPF_PICK_METHOD method) {
	AV1_COMMON *const cm = &cpi->common;
	const int num_planes = av1_num_planes(cm);
	struct loopfilter *const lf = &cm->lf;
	(void)sd;

	lf->sharpness_level = 0;
	cpi->td.mb.rdmult = cpi->rd.RDMULT;

	if (method == LPF_PICK_MINIMAL_LPF) {
	lf->filter_level[0] = 0;
	lf->filter_level[1] = 0;
	} else if (method >= LPF_PICK_FROM_Q) {
	const int min_filter_level = 0;
	const int max_filter_level = av1_get_max_filter_level(cpi);
	const int q = av1_ac_quant_Q3(cm->base_qindex, 0, cm->seq_params.bit_depth);
	// based on tests result for rtc test set
	// 0.04590 boosted or 0.02295 non-booseted in 18-bit fixed point
	const int strength_boost_q_treshold = 700;
	const int inter_frame_multiplier =
	q > strength_boost_q_treshold ? 12034 : 6017;
	// These values were determined by linear fitting the result of the
	// searched level for 8 bit depth:
	// Keyframes: filt_guess = q * 0.06699 - 1.60817
	// Other frames: filt_guess = q * inter_frame_multiplier + 2.48225
	//
	// And high bit depth separately:
	// filt_guess = q * 0.316206 + 3.87252
	int filt_guess;
	switch (cm->seq_params.bit_depth) {
	case AOM_BITS_8:
	filt_guess =
	(cm->current_frame.frame_type == KEY_FRAME)
	? ROUND_POWER_OF_TWO(q * 17563 - 421574, 18)
	: ROUND_POWER_OF_TWO(q * inter_frame_multiplier + 650707, 18);
	break;
	case AOM_BITS_10:
	filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 4060632, 20);
	break;
	case AOM_BITS_12:
	filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 16242526, 22);
	break;
	default:
	assert(0 &&
	"bit_depth should be AOM_BITS_8, AOM_BITS_10 "
	"or AOM_BITS_12");
	return;
	}
	if (cm->seq_params.bit_depth != AOM_BITS_8 &&
	cm->current_frame.frame_type == KEY_FRAME)
	filt_guess -= 4;
	// TODO(chengchen): retrain the model for Y, U, V filter levels
	lf->filter_level[0] = clamp(filt_guess, min_filter_level, max_filter_level);
	lf->filter_level[1] = clamp(filt_guess, min_filter_level, max_filter_level);
	lf->filter_level_u = clamp(filt_guess, min_filter_level, max_filter_level);
	lf->filter_level_v = clamp(filt_guess, min_filter_level, max_filter_level);
	} else {
	const int last_frame_filter_level[4] = { lf->filter_level[0],
	lf->filter_level[1],
	lf->filter_level_u,
	lf->filter_level_v };

	lf->filter_level[0] = lf->filter_level[1] =
	search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
	last_frame_filter_level, NULL, 0, 2);
	lf->filter_level[0] =
	search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
	last_frame_filter_level, NULL, 0, 0);
	lf->filter_level[1] =
	search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
	last_frame_filter_level, NULL, 0, 1);

	if (num_planes > 1) {
	lf->filter_level_u =
	search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
	last_frame_filter_level, NULL, 1, 0);
	lf->filter_level_v =
	search_filter_level(sd, cpi, method == LPF_PICK_FROM_SUBIMAGE,
	last_frame_filter_level, NULL, 2, 0);
	}
	}
	}