blob: 639c25cbfe763755d0cda37176662dc14b0643c2 [file] [log] [blame]
/*
* Copyright (c) 2021, Alliance for Open Media. All rights reserved
*
* This source code is subject to the terms of the BSD 3-Clause Clear License and the
* Alliance for Open Media Patent License 1.0. If the BSD 3-Clause Clear License was
* not distributed with this source code in the LICENSE file, you can obtain it
* at aomedia.org/license/software-license/bsd-3-c-c/. If the Alliance for Open Media Patent
* License 1.0 was not distributed with this source code in the PATENTS file, you
* can obtain it at aomedia.org/license/patent-license/.
*/
#include <assert.h>
#include "config/aom_config.h"
#include "aom_scale/yv12config.h"
#include "aom_mem/aom_mem.h"
#include "aom_scale/aom_scale.h"
#if HAVE_DSPR2
static void extend_plane(uint8_t *const src, int src_stride, int width,
int height, int extend_top, int extend_left,
int extend_bottom, int extend_right) {
int i, j;
uint8_t *left_src, *right_src;
uint8_t *left_dst_start, *right_dst_start;
uint8_t *left_dst, *right_dst;
uint8_t *top_src, *bot_src;
uint8_t *top_dst, *bot_dst;
uint32_t left_pix;
uint32_t right_pix;
uint32_t linesize;
/* copy the left and right most columns out */
left_src = src;
right_src = src + width - 1;
left_dst_start = src - extend_left;
right_dst_start = src + width;
for (i = height; i--;) {
left_dst = left_dst_start;
right_dst = right_dst_start;
__asm__ __volatile__(
"lb %[left_pix], 0(%[left_src]) \n\t"
"lb %[right_pix], 0(%[right_src]) \n\t"
"replv.qb %[left_pix], %[left_pix] \n\t"
"replv.qb %[right_pix], %[right_pix] \n\t"
: [left_pix] "=&r"(left_pix), [right_pix] "=&r"(right_pix)
: [left_src] "r"(left_src), [right_src] "r"(right_src));
for (j = extend_left / 4; j--;) {
__asm__ __volatile__(
"sw %[left_pix], 0(%[left_dst]) \n\t"
"sw %[right_pix], 0(%[right_dst]) \n\t"
:
: [left_dst] "r"(left_dst), [left_pix] "r"(left_pix),
[right_dst] "r"(right_dst), [right_pix] "r"(right_pix));
left_dst += 4;
right_dst += 4;
}
for (j = extend_left % 4; j--;) {
__asm__ __volatile__(
"sb %[left_pix], 0(%[left_dst]) \n\t"
"sb %[right_pix], 0(%[right_dst]) \n\t"
:
: [left_dst] "r"(left_dst), [left_pix] "r"(left_pix),
[right_dst] "r"(right_dst), [right_pix] "r"(right_pix));
left_dst += 1;
right_dst += 1;
}
left_src += src_stride;
right_src += src_stride;
left_dst_start += src_stride;
right_dst_start += src_stride;
}
/* Now copy the top and bottom lines into each line of the respective
* borders
*/
top_src = src - extend_left;
bot_src = src + src_stride * (height - 1) - extend_left;
top_dst = src + src_stride * (-extend_top) - extend_left;
bot_dst = src + src_stride * (height)-extend_left;
linesize = extend_left + extend_right + width;
for (i = 0; i < extend_top; i++) {
memcpy(top_dst, top_src, linesize);
top_dst += src_stride;
}
for (i = 0; i < extend_bottom; i++) {
memcpy(bot_dst, bot_src, linesize);
bot_dst += src_stride;
}
}
static void extend_frame(YV12_BUFFER_CONFIG *const ybf, int ext_size) {
const int c_w = ybf->uv_crop_width;
const int c_h = ybf->uv_crop_height;
const int ss_x = ybf->uv_width < ybf->y_width;
const int ss_y = ybf->uv_height < ybf->y_height;
const int c_et = ext_size >> ss_y;
const int c_el = ext_size >> ss_x;
const int c_eb = c_et + ybf->uv_height - ybf->uv_crop_height;
const int c_er = c_el + ybf->uv_width - ybf->uv_crop_width;
assert(ybf->y_height - ybf->y_crop_height < 16);
assert(ybf->y_width - ybf->y_crop_width < 16);
assert(ybf->y_height - ybf->y_crop_height >= 0);
assert(ybf->y_width - ybf->y_crop_width >= 0);
extend_plane(ybf->y_buffer, ybf->y_stride, ybf->y_crop_width,
ybf->y_crop_height, ext_size, ext_size,
ext_size + ybf->y_height - ybf->y_crop_height,
ext_size + ybf->y_width - ybf->y_crop_width);
extend_plane(ybf->u_buffer, ybf->uv_stride, c_w, c_h, c_et, c_el, c_eb, c_er);
extend_plane(ybf->v_buffer, ybf->uv_stride, c_w, c_h, c_et, c_el, c_eb, c_er);
}
void aom_extend_frame_borders_dspr2(YV12_BUFFER_CONFIG *ybf,
const int num_planes) {
extend_frame(ybf, ybf->border, num_planes);
}
void aom_extend_frame_inner_borders_dspr2(YV12_BUFFER_CONFIG *ybf,
const int num_planes) {
const int inner_bw = (ybf->border > AOMINNERBORDERINPIXELS)
? AOMINNERBORDERINPIXELS
: ybf->border;
extend_frame(ybf, inner_bw, num_planes);
}
#endif