/***************************************************************************** * This file is part of Kvazaar HEVC encoder. * * Copyright (C) 2013-2015 Tampere University of Technology and others (see * COPYING file). * * Kvazaar is free software: you can redistribute it and/or modify it under * the terms of the GNU Lesser General Public License as published by the * Free Software Foundation; either version 2.1 of the License, or (at your * option) any later version. * * Kvazaar is distributed in the hope that it will be useful, but WITHOUT ANY * WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS * FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for * more details. * * You should have received a copy of the GNU General Public License along * with Kvazaar. If not, see . ****************************************************************************/ #include #include #include "cu.h" #include "threads.h" /** * \brief Number of PUs in a CU. * * Indexed by part_mode_t values. */ const uint8_t kvz_part_mode_num_parts[] = { 1, // 2Nx2N 2, // 2NxN 2, // Nx2N 4, // NxN 2, // 2NxnU 2, // 2NxnD 2, // nLx2N 2, // nRx2N }; /** * \brief PU offsets. * * Indexed by [part mode][PU number][axis]. * * Units are 1/4 of the width of the CU. */ const uint8_t kvz_part_mode_offsets[][4][2] = { { {0, 0} }, // 2Nx2N { {0, 0}, {0, 2} }, // 2NxN { {0, 0}, {2, 0} }, // Nx2N { {0, 0}, {2, 0}, {0, 2}, {2, 2} }, // NxN { {0, 0}, {0, 1} }, // 2NxnU { {0, 0}, {0, 3} }, // 2NxnD { {0, 0}, {1, 0} }, // nLx2N { {0, 0}, {3, 0} }, // nRx2N }; /** * \brief PU sizes. * * Indexed by [part mode][PU number][axis]. * * Units are 1/4 of the width of the CU. */ const uint8_t kvz_part_mode_sizes[][4][2] = { { {4, 4} }, // 2Nx2N { {4, 2}, {4, 2} }, // 2NxN { {2, 4}, {2, 4} }, // Nx2N { {2, 2}, {2, 2}, {2, 2}, {2, 2} }, // NxN { {4, 1}, {4, 3} }, // 2NxnU { {4, 3}, {4, 1} }, // 2NxnD { {1, 4}, {3, 4} }, // nLx2N { {3, 4}, {1, 4} }, // nRx2N }; #define BLIT_COEFF_CASE(n) case n:\ for (y = 0; y < n; ++y) {\ memcpy(&dst[y*dst_stride], &orig[y*orig_stride], n * sizeof(coeff_t));\ }\ break; void kvz_coefficients_blit(const coeff_t * const orig, coeff_t * const dst, const unsigned width, const unsigned height, const unsigned orig_stride, const unsigned dst_stride) { unsigned y; int nxn_width = (width == height) ? width : 0; switch (nxn_width) { BLIT_COEFF_CASE(4) BLIT_COEFF_CASE(8) BLIT_COEFF_CASE(16) BLIT_COEFF_CASE(32) BLIT_COEFF_CASE(64) default: for (y = 0; y < height; ++y) { memcpy(&dst[y*dst_stride], &orig[y*orig_stride], width * sizeof(coeff_t)); } break; } } unsigned kvz_coefficients_calc_abs(const coeff_t *const buf, const int buf_stride, const int width) { int sum = 0; int y, x; for (y = 0; y < width; ++y) { for (x = 0; x < width; ++x) { sum += abs(buf[x + y * buf_stride]); } } return sum; } cu_info_t* kvz_cu_array_at(cu_array_t *cua, unsigned x_px, unsigned y_px) { return (cu_info_t*) kvz_cu_array_at_const(cua, x_px, y_px); } const cu_info_t* kvz_cu_array_at_const(const cu_array_t *cua, unsigned x_px, unsigned y_px) { assert(x_px < cua->width); assert(y_px < cua->height); return &(cua)->data[(x_px >> 2) + (y_px >> 2) * ((cua)->width >> 2)]; } /** * \brief Allocate a CU array. * * \param width width of the array in luma pixels * \param height height of the array in luma pixels */ cu_array_t * kvz_cu_array_alloc(const int width, const int height) { cu_array_t *cua = MALLOC(cu_array_t, 1); // Round up to a multiple of cell width and divide by cell width. const int width_scu = (width + 15) >> 2; const int height_scu = (height + 15) >> 2; assert(width_scu * 16 >= width); assert(height_scu * 16 >= height); const unsigned cu_array_size = width_scu * height_scu; cua->data = calloc(cu_array_size, sizeof(cu_info_t)); cua->width = width_scu << 2; cua->height = height_scu << 2; cua->refcount = 1; return cua; } int kvz_cu_array_free(cu_array_t * const cua) { int32_t new_refcount; if (!cua) return 1; new_refcount = KVZ_ATOMIC_DEC(&(cua->refcount)); //Still we have some references, do nothing if (new_refcount > 0) return 1; FREE_POINTER(cua->data); free(cua); return 1; } /** * \brief Copy part of a cu array to another cu array. * * All values are in luma pixels. * * \param dst destination array * \param dst_x x-coordinate of the left edge of the copied area in dst * \param dst_y y-coordinate of the top edge of the copied area in dst * \param src source array * \param src_x x-coordinate of the left edge of the copied area in src * \param src_y y-coordinate of the top edge of the copied area in src * \param width width of the area to copy * \param height height of the area to copy */ void kvz_cu_array_copy(cu_array_t* dst, int dst_x, int dst_y, const cu_array_t* src, int src_x, int src_y, int width, int height) { // Convert values from pixel coordinates to array indices. int src_stride = src->width >> 2; int dst_stride = dst->width >> 2; const cu_info_t* src_ptr = &src->data[(src_x >> 2) + (src_y >> 2) * src_stride]; cu_info_t* dst_ptr = &dst->data[(dst_x >> 2) + (dst_y >> 2) * dst_stride]; // Number of bytes to copy per row. const size_t row_size = sizeof(cu_info_t) * (width >> 2); width = MIN(width, MIN(src->width - src_x, dst->width - dst_x)); height = MIN(height, MIN(src->height - src_y, dst->height - dst_y)); assert(src_x + width <= src->width); assert(src_y + height <= src->height); assert(dst_x + width <= dst->width); assert(dst_y + height <= dst->height); for (int i = 0; i < (height >> 2); ++i) { memcpy(dst_ptr, src_ptr, row_size); src_ptr += src_stride; dst_ptr += dst_stride; } } /** * \brief Copy an lcu to a cu array. * * All values are in luma pixels. * * \param dst destination array * \param dst_x x-coordinate of the left edge of the copied area in dst * \param dst_y y-coordinate of the top edge of the copied area in dst * \param src source lcu */ void kvz_cu_array_copy_from_lcu(cu_array_t* dst, int dst_x, int dst_y, const lcu_t *src) { // Convert values from pixel coordinates to array indices. const int dst_x_scu = dst_x >> 2; const int dst_y_scu = dst_y >> 2; const int dst_stride = dst->width >> 2; for (int y = 0; y < LCU_CU_WIDTH; ++y) { for (int x = 0; x < LCU_CU_WIDTH; ++x) { const cu_info_t *from_cu = LCU_GET_CU(src, x, y); cu_info_t *to_cu = &dst->data[dst_x_scu + x * 2 + (dst_y_scu + y * 2) * dst_stride]; memcpy(to_cu, from_cu, sizeof(*to_cu)); memcpy(to_cu + 1, from_cu, sizeof(*to_cu)); memcpy(to_cu + dst_stride, from_cu, sizeof(*to_cu)); memcpy(to_cu + dst_stride + 1, from_cu, sizeof(*to_cu)); } } }