/* blob: a5ad1a79636d97bb3d1f75995cf4abace99f925a [file] [log] [blame] */
/*
* Copyright (c) 2016, Alliance for Open Media. All rights reserved
*
* This source code is subject to the terms of the BSD 2 Clause License and
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
* was not distributed with this source code in the LICENSE file, you can
* obtain it at www.aomedia.org/license/software. If the Alliance for Open
* Media Patent License 1.0 was not distributed with this source code in the
* PATENTS file, you can obtain it at www.aomedia.org/license/patent.
*/
#include <assert.h>
#include <stdint.h>

#include "aom_mem/aom_mem.h"
#include "aom_ports/mem.h"
#include "aom_scale/yv12config.h"
#include "av1/common/enums.h"
/****************************************************************************
* Exports
****************************************************************************/
/****************************************************************************
*
****************************************************************************/
/* Rounds |addr| up to the next multiple of |align| and yields it as a void *.
 * |align| must be a power of two (1 leaves the address unchanged). The
 * address is carried through uintptr_t, the integer type intended for
 * pointer round-trips, and the whole expansion is parenthesized so it can be
 * used inside larger expressions. */
#define yv12_align_addr(addr, align)                         \
  ((void *)(((uintptr_t)(addr) + ((uintptr_t)(align) - 1)) & \
            ~((uintptr_t)(align) - 1)))
// TODO(jkoleszar): Maybe replace this with struct aom_image
/* Releases the memory owned by |ybf| and zeroes the whole descriptor.
 *
 * Returns 0 on success, or -1 when |ybf| is NULL. */
int aom_free_frame_buffer(YV12_BUFFER_CONFIG *ybf) {
  if (!ybf) return -1;

  // buffer_alloc is only released when a non-zero size was recorded for it.
  if (ybf->buffer_alloc_sz > 0) aom_free(ybf->buffer_alloc);
  if (ybf->y_buffer_8bit != NULL) aom_free(ybf->y_buffer_8bit);

  /* Most functions never touch buffer_alloc directly; they go through
     y_buffer, u_buffer and v_buffer, which point into it. Wipe every field
     so that none of those pointers can be used after the free. */
  memset(ybf, 0, sizeof(*ybf));
  return 0;
}
/* Provides storage for |ybf| and fills in its plane geometry from values the
 * caller has already computed (strides, plane sizes, aligned dimensions and
 * chroma borders).
 *
 * Storage comes from one of two places:
 *  - when |cb| is non-NULL, |cb| is asked to fill |fb| with at least
 *    frame_size + 31 bytes, and the start is rounded up to a 32-byte
 *    boundary;
 *  - otherwise ybf->buffer_alloc is reused if it is already large enough, or
 *    freed and replaced by a zero-filled 32-byte-aligned allocation.
 *
 * For high bitdepth a separate y_buffer_8bit plane of |yplane_size| bytes is
 * (re)allocated as well; for 8-bit any existing y_buffer_8bit is released.
 *
 * Returns 0 on success, -2 when |ybf| is NULL, and -1 when a size limit is
 * exceeded, a size does not fit in size_t, the callback fails or returns too
 * small a buffer, or an allocation fails. On a -1 return |ybf| may be left
 * partially updated. */
static int realloc_frame_buffer_aligned(
    YV12_BUFFER_CONFIG *ybf, int width, int height, int ss_x, int ss_y,
    int use_highbitdepth, int border, int byte_alignment,
    aom_codec_frame_buffer_t *fb, aom_get_frame_buffer_cb_fn_t cb,
    void *cb_priv, const int y_stride, const uint64_t yplane_size,
    const uint64_t uvplane_size, const int aligned_width,
    const int aligned_height, const int uv_width, const int uv_height,
    const int uv_stride, const int uv_border_w, const int uv_border_h) {
  if (!ybf) return -2;

  // A byte_alignment of 0 means "no extra alignment", i.e. align to 1.
  const int aom_byte_align = (byte_alignment == 0) ? 1 : byte_alignment;
  // One luma plane plus two chroma planes, doubled for high bitdepth.
  const uint64_t frame_size =
      (1 + use_highbitdepth) * (yplane_size + 2 * uvplane_size);
  uint8_t *buf = NULL;

#if defined AOM_MAX_ALLOCABLE_MEMORY
  // The size of ybf->buffer_alloc.
  uint64_t alloc_size = frame_size;
  // The size of ybf->y_buffer_8bit.
  if (use_highbitdepth) alloc_size += yplane_size;
  // The decoder may allocate REF_FRAMES frame buffers in the frame buffer
  // pool. Bound the total amount of allocated memory as if these REF_FRAMES
  // frame buffers were allocated in a single allocation.
  if (alloc_size > AOM_MAX_ALLOCABLE_MEMORY / REF_FRAMES) return -1;
#endif

  if (cb != NULL) {
    // Extra bytes so the start of the buffer can be rounded up to 32 bytes.
    const int align_addr_extra_size = 31;
    const uint64_t external_frame_size = frame_size + align_addr_extra_size;

    assert(fb != NULL);

    // Reject sizes that would be truncated when passed as size_t.
    if (external_frame_size != (size_t)external_frame_size) return -1;

    // Allocation to hold larger frame, or first allocation.
    if (cb(cb_priv, (size_t)external_frame_size, fb) < 0) return -1;

    if (fb->data == NULL || fb->size < external_frame_size) return -1;

    ybf->buffer_alloc = (uint8_t *)yv12_align_addr(fb->data, 32);

#if defined(__has_feature)
#if __has_feature(memory_sanitizer)
    // This memset is needed for fixing the issue of using uninitialized
    // value in msan test. It will cause a perf loss, so only do this for
    // msan test.
    memset(ybf->buffer_alloc, 0, (size_t)frame_size);
#endif
#endif
  } else if (frame_size > ybf->buffer_alloc_sz) {
    // Allocation to hold larger frame, or first allocation.
    aom_free(ybf->buffer_alloc);
    ybf->buffer_alloc = NULL;
    ybf->buffer_alloc_sz = 0;

    // Reject sizes that would be truncated when passed as size_t.
    if (frame_size != (size_t)frame_size) return -1;

    ybf->buffer_alloc = (uint8_t *)aom_memalign(32, (size_t)frame_size);
    if (!ybf->buffer_alloc) return -1;

    ybf->buffer_alloc_sz = (size_t)frame_size;

    // This memset is needed for fixing valgrind error from C loop filter
    // due to access uninitialized memory in frame border. It could be
    // removed if border is totally removed.
    memset(ybf->buffer_alloc, 0, ybf->buffer_alloc_sz);
  }

  ybf->y_crop_width = width;
  ybf->y_crop_height = height;
  ybf->y_width = aligned_width;
  ybf->y_height = aligned_height;
  ybf->y_stride = y_stride;

  // Chroma crop dimensions round up when the luma dimension is odd.
  ybf->uv_crop_width = (width + ss_x) >> ss_x;
  ybf->uv_crop_height = (height + ss_y) >> ss_y;
  ybf->uv_width = uv_width;
  ybf->uv_height = uv_height;
  ybf->uv_stride = uv_stride;

  ybf->border = border;
  ybf->frame_size = (size_t)frame_size;
  ybf->subsampling_x = ss_x;
  ybf->subsampling_y = ss_y;

  buf = ybf->buffer_alloc;
  if (use_highbitdepth) {
    // Store uint16 addresses when using 16bit framebuffers
    buf = CONVERT_TO_BYTEPTR(ybf->buffer_alloc);
    ybf->flags = YV12_FLAG_HIGHBITDEPTH;
  } else {
    ybf->flags = 0;
  }

  // Each plane starts past its top border rows and left border columns,
  // rounded up to the requested byte alignment.
  ybf->y_buffer = (uint8_t *)yv12_align_addr(
      buf + (border * y_stride) + border, aom_byte_align);
  ybf->u_buffer = (uint8_t *)yv12_align_addr(
      buf + yplane_size + (uv_border_h * uv_stride) + uv_border_w,
      aom_byte_align);
  ybf->v_buffer =
      (uint8_t *)yv12_align_addr(buf + yplane_size + uvplane_size +
                                     (uv_border_h * uv_stride) + uv_border_w,
                                 aom_byte_align);

  ybf->use_external_reference_buffers = 0;

  if (use_highbitdepth) {
    if (ybf->y_buffer_8bit) aom_free(ybf->y_buffer_8bit);
    ybf->y_buffer_8bit = (uint8_t *)aom_memalign(32, (size_t)yplane_size);
    // The plane was just replaced (or the allocation failed), so whatever
    // the validity flag said about the previous contents no longer applies.
    ybf->buf_8bit_valid = 0;
    if (!ybf->y_buffer_8bit) return -1;
  } else {
    if (ybf->y_buffer_8bit) {
      aom_free(ybf->y_buffer_8bit);
      ybf->y_buffer_8bit = NULL;
      ybf->buf_8bit_valid = 0;
    }
  }

  ybf->corrupted = 0; /* assume not corrupted by errors */
  return 0;
}
/* Derives the luma/chroma strides and per-plane byte counts for a frame.
 *
 * The luma stride is the bordered width rounded up to a multiple of 32; the
 * chroma stride is that value shifted right by |ss_x|. Each plane size is
 * (rows + top and bottom border) * stride, plus |byte_alignment| bytes.
 *
 * Returns 0 on success. Returns -3, leaving every output untouched, when
 * |border| is not a multiple of 32. */
static int calc_stride_and_planesize(const int ss_x, const int ss_y,
                                     const int aligned_width,
                                     const int aligned_height, const int border,
                                     const int byte_alignment, int *y_stride,
                                     int *uv_stride, uint64_t *yplane_size,
                                     uint64_t *uvplane_size,
                                     const int uv_height) {
  /* Borders must be a multiple of 32. That restriction is what gives
   * 16-byte alignment at the start of the chroma rows without inserting an
   * arbitrary gap between planes, which would break the semantics of things
   * like aom_img_set_rect(). */
  if ((border & 0x1f) != 0) return -3;

  const int luma_stride = (aligned_width + 2 * border + 31) & ~31;
  const int chroma_stride = luma_stride >> ss_x;
  const int luma_rows = aligned_height + 2 * border;
  const int chroma_rows = uv_height + 2 * (border >> ss_y);

  *y_stride = luma_stride;
  *yplane_size = luma_rows * (uint64_t)luma_stride + byte_alignment;
  *uv_stride = chroma_stride;
  *uvplane_size = chroma_rows * (uint64_t)chroma_stride + byte_alignment;
  return 0;
}
/* (Re)allocates |ybf| for a |width| x |height| frame.
 *
 * Luma dimensions are rounded up to a multiple of 8; chroma dimensions and
 * borders are the luma values shifted right by |ss_x| / |ss_y|. Strides and
 * plane sizes come from calc_stride_and_planesize(), and the storage itself
 * is set up by realloc_frame_buffer_aligned().
 *
 * Returns -1 when CONFIG_SIZE_LIMIT is enabled and the frame exceeds the
 * decode limits, -2 when |ybf| is NULL, and otherwise whatever the two
 * helpers return (0 on success). */
int aom_realloc_frame_buffer(YV12_BUFFER_CONFIG *ybf, int width, int height,
                             int ss_x, int ss_y, int use_highbitdepth,
                             int border, int byte_alignment,
                             aom_codec_frame_buffer_t *fb,
                             aom_get_frame_buffer_cb_fn_t cb, void *cb_priv) {
#if CONFIG_SIZE_LIMIT
  if (width > DECODE_WIDTH_LIMIT || height > DECODE_HEIGHT_LIMIT) return -1;
#endif
  if (!ybf) return -2;

  // Luma dimensions padded to a multiple of 8.
  const int luma_w = (width + 7) & ~7;
  const int luma_h = (height + 7) & ~7;

  // Chroma geometry follows from the subsampling shifts.
  const int chroma_w = luma_w >> ss_x;
  const int chroma_h = luma_h >> ss_y;
  const int chroma_border_w = border >> ss_x;
  const int chroma_border_h = border >> ss_y;

  int luma_stride = 0;
  int chroma_stride = 0;
  uint64_t luma_plane_bytes = 0;
  uint64_t chroma_plane_bytes = 0;

  const int status = calc_stride_and_planesize(
      ss_x, ss_y, luma_w, luma_h, border, byte_alignment, &luma_stride,
      &chroma_stride, &luma_plane_bytes, &chroma_plane_bytes, chroma_h);
  if (status) return status;

  return realloc_frame_buffer_aligned(
      ybf, width, height, ss_x, ss_y, use_highbitdepth, border,
      byte_alignment, fb, cb, cb_priv, luma_stride, luma_plane_bytes,
      chroma_plane_bytes, luma_w, luma_h, chroma_w, chroma_h, chroma_stride,
      chroma_border_w, chroma_border_h);
}
// TODO(anyone): This function sizes the lookahead buffer as if the frame
// width and height were aligned to 128. The variance calculation in
// simple_motion_search_get_best_ref() currently runs over full superblocks
// (an integral multiple of the max sb size, 128 or 64), so partial
// superblocks need up to 127 pixels beyond the frame boundary. The 128
// alignment can be dropped once the variance calculation is adjusted for
// partial superblocks.
// NOTE: The chroma width and height stored in the buffer need not be
// aligned to 128, since the variance calculation only touches the luma
// plane.
//
// Strides and plane sizes are computed from the 128-aligned dimensions,
// while the dimensions recorded in |ybf| use the usual 8-aligned values.
// Returns -2 when |ybf| is NULL, otherwise the result of
// calc_stride_and_planesize() / realloc_frame_buffer_aligned().
int aom_realloc_lookahead_buffer(YV12_BUFFER_CONFIG *ybf, int width, int height,
                                 int ss_x, int ss_y, int use_highbitdepth,
                                 int border, int byte_alignment,
                                 aom_codec_frame_buffer_t *fb,
                                 aom_get_frame_buffer_cb_fn_t cb,
                                 void *cb_priv) {
  if (!ybf) return -2;

  // Dimensions used only to size the allocation (128-aligned luma).
  const int alloc_luma_w = (width + 127) & ~127;
  const int alloc_luma_h = (height + 127) & ~127;
  const int alloc_chroma_h = alloc_luma_h >> ss_y;

  // Dimensions recorded in the buffer descriptor (8-aligned luma).
  const int luma_w = (width + 7) & ~7;
  const int luma_h = (height + 7) & ~7;
  const int chroma_w = luma_w >> ss_x;
  const int chroma_h = luma_h >> ss_y;
  const int chroma_border_w = border >> ss_x;
  const int chroma_border_h = border >> ss_y;

  int luma_stride = 0;
  int chroma_stride = 0;
  uint64_t luma_plane_bytes = 0;
  uint64_t chroma_plane_bytes = 0;

  const int status = calc_stride_and_planesize(
      ss_x, ss_y, alloc_luma_w, alloc_luma_h, border, byte_alignment,
      &luma_stride, &chroma_stride, &luma_plane_bytes, &chroma_plane_bytes,
      alloc_chroma_h);
  if (status) return status;

  return realloc_frame_buffer_aligned(
      ybf, width, height, ss_x, ss_y, use_highbitdepth, border,
      byte_alignment, fb, cb, cb_priv, luma_stride, luma_plane_bytes,
      chroma_plane_bytes, luma_w, luma_h, chroma_w, chroma_h, chroma_stride,
      chroma_border_w, chroma_border_h);
}
/* Frees whatever |ybf| currently holds, then allocates it afresh through
 * aom_realloc_frame_buffer() without an external frame-buffer callback.
 *
 * Returns -2 when |ybf| is NULL, otherwise the result of
 * aom_realloc_frame_buffer(). */
int aom_alloc_frame_buffer(YV12_BUFFER_CONFIG *ybf, int width, int height,
                           int ss_x, int ss_y, int use_highbitdepth, int border,
                           int byte_alignment) {
  if (!ybf) return -2;

  aom_free_frame_buffer(ybf);
  return aom_realloc_frame_buffer(ybf, width, height, ss_x, ss_y,
                                  use_highbitdepth, border, byte_alignment,
                                  /*fb=*/NULL, /*cb=*/NULL, /*cb_priv=*/NULL);
}