mirror of
https://github.com/ultravideo/uvg266.git
synced 2024-11-24 10:34:05 +00:00
dc6b2024ea
Changes asserts on the reference count of objects to assert the value after KVZ_ATOMIC_INC instead of directly checking the value. Fixes some data races detected by TSan.
218 lines
5.9 KiB
C
218 lines
5.9 KiB
C
/*****************************************************************************
|
|
* This file is part of Kvazaar HEVC encoder.
|
|
*
|
|
* Copyright (C) 2013-2015 Tampere University of Technology and others (see
|
|
* COPYING file).
|
|
*
|
|
* Kvazaar is free software: you can redistribute it and/or modify it under
|
|
* the terms of the GNU Lesser General Public License as published by the
|
|
* Free Software Foundation; either version 2.1 of the License, or (at your
|
|
* option) any later version.
|
|
*
|
|
* Kvazaar is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
* FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for
|
|
* more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with Kvazaar. If not, see <http://www.gnu.org/licenses/>.
|
|
****************************************************************************/
|
|
|
|
#include <string.h>
|
|
#include <stdlib.h>
|
|
|
|
#include "cu.h"
|
|
#include "threads.h"
|
|
|
|
|
|
/**
|
|
* \brief Number of PUs in a CU.
|
|
*
|
|
* Indexed by part_mode_t values.
|
|
*/
|
|
const uint8_t kvz_part_mode_num_parts[] = {
|
|
1, // 2Nx2N
|
|
2, // 2NxN
|
|
2, // Nx2N
|
|
4, // NxN
|
|
2, // 2NxnU
|
|
2, // 2NxnD
|
|
2, // nLx2N
|
|
2, // nRx2N
|
|
};
|
|
|
|
/**
|
|
* \brief PU offsets.
|
|
*
|
|
* Indexed by [part mode][PU number][axis].
|
|
*
|
|
* Units are 1/4 of the width of the CU.
|
|
*/
|
|
const uint8_t kvz_part_mode_offsets[][4][2] = {
|
|
{ {0, 0} }, // 2Nx2N
|
|
{ {0, 0}, {0, 2} }, // 2NxN
|
|
{ {0, 0}, {2, 0} }, // Nx2N
|
|
{ {0, 0}, {2, 0}, {0, 2}, {2, 2} }, // NxN
|
|
{ {0, 0}, {0, 1} }, // 2NxnU
|
|
{ {0, 0}, {0, 3} }, // 2NxnD
|
|
{ {0, 0}, {1, 0} }, // nLx2N
|
|
{ {0, 0}, {3, 0} }, // nRx2N
|
|
};
|
|
|
|
/**
|
|
* \brief PU sizes.
|
|
*
|
|
* Indexed by [part mode][PU number][axis].
|
|
*
|
|
* Units are 1/4 of the width of the CU.
|
|
*/
|
|
const uint8_t kvz_part_mode_sizes[][4][2] = {
|
|
{ {4, 4} }, // 2Nx2N
|
|
{ {4, 2}, {4, 2} }, // 2NxN
|
|
{ {2, 4}, {2, 4} }, // Nx2N
|
|
{ {2, 2}, {2, 2}, {2, 2}, {2, 2} }, // NxN
|
|
{ {4, 1}, {4, 3} }, // 2NxnU
|
|
{ {4, 3}, {4, 1} }, // 2NxnD
|
|
{ {1, 4}, {3, 4} }, // nLx2N
|
|
{ {3, 4}, {1, 4} }, // nRx2N
|
|
};
|
|
|
|
|
|
cu_info_t* kvz_cu_array_at(cu_array_t *cua, unsigned x_px, unsigned y_px)
|
|
{
|
|
return (cu_info_t*) kvz_cu_array_at_const(cua, x_px, y_px);
|
|
}
|
|
|
|
|
|
const cu_info_t* kvz_cu_array_at_const(const cu_array_t *cua, unsigned x_px, unsigned y_px)
|
|
{
|
|
assert(x_px < cua->width);
|
|
assert(y_px < cua->height);
|
|
return &(cua)->data[(x_px >> 2) + (y_px >> 2) * ((cua)->stride >> 2)];
|
|
}
|
|
|
|
|
|
/**
|
|
* \brief Allocate a CU array.
|
|
*
|
|
* \param width width of the array in luma pixels
|
|
* \param height height of the array in luma pixels
|
|
*/
|
|
cu_array_t * kvz_cu_array_alloc(const int width, const int height)
|
|
{
|
|
cu_array_t *cua = MALLOC(cu_array_t, 1);
|
|
|
|
// Round up to a multiple of LCU width and divide by cell width.
|
|
const int width_scu = CEILDIV(width, LCU_WIDTH) * LCU_WIDTH / SCU_WIDTH;
|
|
const int height_scu = CEILDIV(height, LCU_WIDTH) * LCU_WIDTH / SCU_WIDTH;
|
|
const unsigned cu_array_size = width_scu * height_scu;
|
|
|
|
cua->base = NULL;
|
|
cua->data = calloc(cu_array_size, sizeof(cu_info_t));
|
|
cua->width = width_scu * SCU_WIDTH;
|
|
cua->height = height_scu * SCU_WIDTH;
|
|
cua->stride = cua->width;
|
|
cua->refcount = 1;
|
|
|
|
return cua;
|
|
}
|
|
|
|
|
|
cu_array_t * kvz_cu_subarray(cu_array_t *base,
|
|
const unsigned x_offset,
|
|
const unsigned y_offset,
|
|
const unsigned width,
|
|
const unsigned height)
|
|
{
|
|
assert(x_offset + width <= base->width);
|
|
assert(y_offset + height <= base->height);
|
|
|
|
if (x_offset == 0 &&
|
|
y_offset == 0 &&
|
|
width == base->width &&
|
|
height == base->height)
|
|
{
|
|
return kvz_cu_array_copy_ref(base);
|
|
}
|
|
|
|
cu_array_t *cua = MALLOC(cu_array_t, 1);
|
|
|
|
// Find the real base array.
|
|
cu_array_t *real_base = base;
|
|
while (real_base->base) {
|
|
real_base = real_base->base;
|
|
}
|
|
cua->base = kvz_cu_array_copy_ref(real_base);
|
|
cua->data = kvz_cu_array_at(base, x_offset, y_offset);
|
|
cua->width = width;
|
|
cua->height = height;
|
|
cua->stride = base->stride;
|
|
cua->refcount = 1;
|
|
|
|
return cua;
|
|
}
|
|
|
|
void kvz_cu_array_free(cu_array_t **cua_ptr)
|
|
{
|
|
cu_array_t *cua = *cua_ptr;
|
|
if (cua == NULL) return;
|
|
*cua_ptr = NULL;
|
|
|
|
int new_refcount = KVZ_ATOMIC_DEC(&cua->refcount);
|
|
if (new_refcount > 0) {
|
|
// Still we have some references, do nothing.
|
|
return;
|
|
}
|
|
|
|
assert(new_refcount == 0);
|
|
|
|
if (!cua->base) {
|
|
FREE_POINTER(cua->data);
|
|
} else {
|
|
kvz_cu_array_free(&cua->base);
|
|
cua->data = NULL;
|
|
}
|
|
|
|
FREE_POINTER(cua);
|
|
}
|
|
|
|
|
|
/**
|
|
* \brief Get a new pointer to a cu array.
|
|
*
|
|
* Increment reference count and return the cu array.
|
|
*/
|
|
cu_array_t * kvz_cu_array_copy_ref(cu_array_t* cua)
|
|
{
|
|
int32_t new_refcount = KVZ_ATOMIC_INC(&cua->refcount);
|
|
// The caller should have had another reference and we added one
|
|
// reference so refcount should be at least 2.
|
|
assert(new_refcount >= 2);
|
|
return cua;
|
|
}
|
|
|
|
|
|
/**
|
|
* \brief Copy an lcu to a cu array.
|
|
*
|
|
* All values are in luma pixels.
|
|
*
|
|
* \param dst destination array
|
|
* \param dst_x x-coordinate of the left edge of the copied area in dst
|
|
* \param dst_y y-coordinate of the top edge of the copied area in dst
|
|
* \param src source lcu
|
|
*/
|
|
void kvz_cu_array_copy_from_lcu(cu_array_t* dst, int dst_x, int dst_y, const lcu_t *src)
|
|
{
|
|
const int dst_stride = dst->stride >> 2;
|
|
for (int y = 0; y < LCU_WIDTH; y += SCU_WIDTH) {
|
|
for (int x = 0; x < LCU_WIDTH; x += SCU_WIDTH) {
|
|
const cu_info_t *from_cu = LCU_GET_CU_AT_PX(src, x, y);
|
|
const int x_scu = (dst_x + x) >> 2;
|
|
const int y_scu = (dst_y + y) >> 2;
|
|
cu_info_t *to_cu = &dst->data[x_scu + y_scu * dst_stride];
|
|
memcpy(to_cu, from_cu, sizeof(*to_cu));
|
|
}
|
|
}
|
|
}
|