2014-01-24 10:37:15 +00:00
|
|
|
/*****************************************************************************
|
|
|
|
* This file is part of Kvazaar HEVC encoder.
|
2014-02-21 13:00:20 +00:00
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* Copyright (C) 2013-2015 Tampere University of Technology and others (see
|
2014-01-24 10:37:15 +00:00
|
|
|
* COPYING file).
|
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* Kvazaar is free software: you can redistribute it and/or modify it under
|
|
|
|
* the terms of the GNU Lesser General Public License as published by the
|
|
|
|
* Free Software Foundation; either version 2.1 of the License, or (at your
|
|
|
|
* option) any later version.
|
2014-01-24 10:37:15 +00:00
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* Kvazaar is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
|
|
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
|
|
* FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for
|
|
|
|
* more details.
|
2014-01-24 10:37:15 +00:00
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* You should have received a copy of the GNU General Public License along
|
|
|
|
* with Kvazaar. If not, see <http://www.gnu.org/licenses/>.
|
2014-01-24 10:37:15 +00:00
|
|
|
****************************************************************************/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* \file
|
2012-06-05 11:01:47 +00:00
|
|
|
*/
|
|
|
|
|
2013-09-18 09:16:03 +00:00
|
|
|
#include "encoder.h"
|
|
|
|
|
2012-06-05 11:01:47 +00:00
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
2013-09-09 15:32:16 +00:00
|
|
|
#include <assert.h>
|
2013-09-18 09:16:03 +00:00
|
|
|
|
2014-04-16 06:09:10 +00:00
|
|
|
#include "tables.h"
|
2012-06-05 11:01:47 +00:00
|
|
|
#include "config.h"
|
|
|
|
#include "cabac.h"
|
2014-06-05 12:54:58 +00:00
|
|
|
#include "image.h"
|
2012-06-05 12:38:54 +00:00
|
|
|
#include "nal.h"
|
2012-08-15 10:22:31 +00:00
|
|
|
#include "context.h"
|
2013-02-05 13:48:06 +00:00
|
|
|
#include "transform.h"
|
2013-03-07 15:42:00 +00:00
|
|
|
#include "intra.h"
|
2013-09-12 15:50:11 +00:00
|
|
|
#include "inter.h"
|
2013-04-04 12:08:28 +00:00
|
|
|
#include "filter.h"
|
2013-04-16 12:10:43 +00:00
|
|
|
#include "search.h"
|
2013-11-04 17:27:47 +00:00
|
|
|
#include "sao.h"
|
2014-01-28 10:14:43 +00:00
|
|
|
#include "rdo.h"
|
2012-06-05 11:01:47 +00:00
|
|
|
|
2015-05-27 12:41:45 +00:00
|
|
|
static int encoder_control_init_gop_layer_weights(encoder_control_t * const);
|
2014-05-08 10:00:23 +00:00
|
|
|
|
2015-06-30 06:14:31 +00:00
|
|
|
static int size_of_wpp_ends(int threads)
|
|
|
|
{
|
|
|
|
// Based on the shape of the area where all threads can't yet run in parallel.
|
|
|
|
return 4 * threads * threads - 2 * threads;
|
|
|
|
}
|
|
|
|
|
2015-06-30 08:03:26 +00:00
|
|
|
static int select_owf_auto(const kvz_config *const cfg)
|
2015-06-30 06:14:31 +00:00
|
|
|
{
|
|
|
|
if (cfg->wpp) {
|
|
|
|
// If wpp is on, select owf such that less than 15% of the
|
|
|
|
// frame is covered by the are threads can not work at the same time.
|
|
|
|
const int lcu_width = CEILDIV(cfg->width, LCU_WIDTH);
|
|
|
|
const int lcu_height = CEILDIV(cfg->height, LCU_WIDTH);
|
|
|
|
|
|
|
|
// Find the largest number of threads per frame that satifies the
|
|
|
|
// the condition: wpp start/stop inefficiency takes up less than 15%
|
|
|
|
// of frame area.
|
|
|
|
int threads_per_frame = 1;
|
|
|
|
const int wpp_treshold = lcu_width * lcu_height * 15 / 100;
|
|
|
|
while ((threads_per_frame + 1) * 2 < lcu_width &&
|
|
|
|
threads_per_frame + 1 < lcu_height &&
|
|
|
|
size_of_wpp_ends(threads_per_frame + 1) < wpp_treshold)
|
|
|
|
{
|
|
|
|
++threads_per_frame;
|
|
|
|
}
|
|
|
|
|
|
|
|
const int threads = MAX(cfg->threads, 1);
|
|
|
|
const int frames = CEILDIV(threads, threads_per_frame);
|
|
|
|
|
|
|
|
// Convert from number of parallel frames to number of additional frames.
|
|
|
|
return CLIP(0, threads - 1, frames - 1);
|
|
|
|
} else {
|
|
|
|
// If wpp is not on, select owf such that there is enough
|
|
|
|
// tiles for twice the number of threads.
|
|
|
|
|
|
|
|
int tiles_per_frame = 1;
|
|
|
|
if (cfg->tiles_width_count > 0) {
|
|
|
|
tiles_per_frame *= cfg->tiles_width_count + 1;
|
|
|
|
}
|
|
|
|
if (cfg->tiles_height_count > 0) {
|
|
|
|
tiles_per_frame *= cfg->tiles_height_count + 1;
|
|
|
|
}
|
|
|
|
int threads = (cfg->threads > 1 ? cfg->threads : 1);
|
|
|
|
int frames = CEILDIV(threads * 4, tiles_per_frame);
|
|
|
|
|
|
|
|
// Limit number of frames to 1.25x the number of threads for the case
|
|
|
|
// where there is only 1 tile per frame.
|
|
|
|
frames = CLIP(1, threads * 4 / 3, frames);
|
|
|
|
return frames - 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* \brief Allocate and initialize an encoder control structure.
|
|
|
|
*
|
|
|
|
* \param cfg encoder configuration
|
|
|
|
* \return initialized encoder control or NULL on failure
|
|
|
|
*/
|
2015-06-30 08:03:26 +00:00
|
|
|
encoder_control_t* encoder_control_init(const kvz_config *const cfg) {
|
2015-06-30 06:14:31 +00:00
|
|
|
encoder_control_t *encoder = NULL;
|
|
|
|
|
2014-01-31 18:34:50 +00:00
|
|
|
if (!cfg) {
|
|
|
|
fprintf(stderr, "Config object must not be null!\n");
|
2015-06-30 06:14:31 +00:00
|
|
|
goto init_failed;
|
2014-01-31 18:34:50 +00:00
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
|
|
|
// Make sure that the parameters make sense.
|
|
|
|
if (!config_validate(cfg)) {
|
|
|
|
goto init_failed;
|
|
|
|
}
|
|
|
|
|
|
|
|
encoder = calloc(1, sizeof(encoder_control_t));
|
|
|
|
if (!encoder) {
|
|
|
|
fprintf(stderr, "Failed to allocate encoder control.\n");
|
|
|
|
goto init_failed;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Need to set owf before initializing threadqueue.
|
|
|
|
if (cfg->owf >= 0) {
|
|
|
|
encoder->owf = cfg->owf;
|
|
|
|
} else {
|
|
|
|
encoder->owf = select_owf_auto(cfg);
|
|
|
|
fprintf(stderr, "--owf=auto value set to %d.\n", encoder->owf);
|
|
|
|
}
|
|
|
|
|
2015-03-04 14:30:20 +00:00
|
|
|
encoder->threadqueue = MALLOC(threadqueue_queue_t, 1);
|
2015-06-30 06:14:31 +00:00
|
|
|
if (!encoder->threadqueue ||
|
|
|
|
!threadqueue_init(encoder->threadqueue,
|
|
|
|
cfg->threads,
|
|
|
|
encoder->owf > 0)) {
|
|
|
|
fprintf(stderr, "Could not initialize threadqueue.\n");
|
|
|
|
goto init_failed;
|
2014-05-13 09:28:15 +00:00
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-17 12:42:20 +00:00
|
|
|
// Config pointer to config struct
|
|
|
|
encoder->cfg = cfg;
|
2015-08-11 05:42:09 +00:00
|
|
|
|
|
|
|
encoder->bitdepth = KVZ_BIT_DEPTH;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-01-31 18:34:50 +00:00
|
|
|
// deblocking filter
|
2014-04-17 12:42:20 +00:00
|
|
|
encoder->deblock_enable = 1;
|
|
|
|
encoder->beta_offset_div2 = 0;
|
|
|
|
encoder->tc_offset_div2 = 0;
|
2014-01-31 18:34:50 +00:00
|
|
|
// SAO
|
2014-04-17 12:42:20 +00:00
|
|
|
encoder->sao_enable = 1;
|
2014-04-07 11:36:01 +00:00
|
|
|
// Rate-distortion optimization level
|
2014-04-17 12:42:20 +00:00
|
|
|
encoder->rdo = 1;
|
2014-06-17 12:32:05 +00:00
|
|
|
encoder->full_intra_search = 0;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-01-31 18:34:50 +00:00
|
|
|
// Initialize the scaling list
|
2014-04-17 12:42:20 +00:00
|
|
|
scalinglist_init(&encoder->scaling_list);
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-15 12:20:26 +00:00
|
|
|
// CQM
|
|
|
|
{
|
|
|
|
FILE* cqmfile;
|
|
|
|
cqmfile = cfg->cqmfile ? fopen(cfg->cqmfile, "rb") : NULL;
|
|
|
|
if (cqmfile) {
|
2014-04-17 12:42:20 +00:00
|
|
|
scalinglist_parse(&encoder->scaling_list, cqmfile);
|
2014-04-15 12:20:26 +00:00
|
|
|
fclose(cqmfile);
|
|
|
|
}
|
|
|
|
}
|
2014-04-17 12:42:20 +00:00
|
|
|
scalinglist_process(&encoder->scaling_list, encoder->bitdepth);
|
2014-04-15 12:20:26 +00:00
|
|
|
|
2014-04-22 11:50:24 +00:00
|
|
|
encoder_control_input_init(encoder, cfg->width, cfg->height);
|
2015-05-27 12:41:45 +00:00
|
|
|
|
|
|
|
encoder->target_avg_bppic = cfg->target_bitrate / cfg->framerate;
|
|
|
|
encoder->target_avg_bpp = encoder->target_avg_bppic / encoder->in.pixels_per_pic;
|
|
|
|
|
|
|
|
if (!encoder_control_init_gop_layer_weights(encoder)) {
|
2015-06-30 06:14:31 +00:00
|
|
|
goto init_failed;
|
2015-05-27 12:41:45 +00:00
|
|
|
}
|
2014-04-22 11:50:24 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//Tiles
|
2015-06-30 06:14:31 +00:00
|
|
|
encoder->tiles_enable = encoder->cfg->tiles_width_count > 0 ||
|
|
|
|
encoder->cfg->tiles_height_count > 0;
|
|
|
|
|
2014-05-01 12:10:22 +00:00
|
|
|
{
|
2014-04-02 09:31:12 +00:00
|
|
|
int i, j; //iteration variables
|
|
|
|
const int num_ctbs = encoder->in.width_in_lcu * encoder->in.height_in_lcu;
|
|
|
|
int tileIdx, x, y; //iterations variable for 6-9
|
|
|
|
|
|
|
|
//Temporary pointers to allow encoder fields to be const
|
|
|
|
int32_t *tiles_col_width, *tiles_row_height, *tiles_ctb_addr_rs_to_ts, *tiles_ctb_addr_ts_to_rs, *tiles_tile_id, *tiles_col_bd, *tiles_row_bd;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-05-01 05:11:31 +00:00
|
|
|
if (encoder->cfg->tiles_width_count >= encoder->in.width_in_lcu) {
|
|
|
|
fprintf(stderr, "Too many tiles (width)!\n");
|
2015-06-30 06:14:31 +00:00
|
|
|
goto init_failed;
|
|
|
|
|
2014-05-01 05:11:31 +00:00
|
|
|
} else if (encoder->cfg->tiles_height_count >= encoder->in.height_in_lcu) {
|
|
|
|
fprintf(stderr, "Too many tiles (height)!\n");
|
2015-06-30 06:14:31 +00:00
|
|
|
goto init_failed;
|
2014-05-01 05:11:31 +00:00
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//Will be (perhaps) changed later
|
|
|
|
encoder->tiles_uniform_spacing_flag = 1;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//tilesn[x,y] contains the number of _separation_ between tiles, whereas the encoder needs the number of tiles.
|
|
|
|
encoder->tiles_num_tile_columns = encoder->cfg->tiles_width_count + 1;
|
|
|
|
encoder->tiles_num_tile_rows = encoder->cfg->tiles_height_count + 1;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
|
|
|
encoder->tiles_col_width = tiles_col_width =
|
|
|
|
MALLOC(int32_t, encoder->tiles_num_tile_columns);
|
|
|
|
encoder->tiles_row_height = tiles_row_height =
|
|
|
|
MALLOC(int32_t, encoder->tiles_num_tile_rows);
|
|
|
|
|
|
|
|
encoder->tiles_col_bd = tiles_col_bd =
|
2015-07-06 07:48:19 +00:00
|
|
|
MALLOC(int32_t, encoder->tiles_num_tile_columns + 1);
|
|
|
|
encoder->tiles_row_bd = tiles_row_bd =
|
2015-06-30 06:14:31 +00:00
|
|
|
MALLOC(int32_t, encoder->tiles_num_tile_rows + 1);
|
|
|
|
|
|
|
|
encoder->tiles_ctb_addr_rs_to_ts = tiles_ctb_addr_rs_to_ts =
|
|
|
|
MALLOC(int32_t, num_ctbs);
|
|
|
|
encoder->tiles_ctb_addr_ts_to_rs = tiles_ctb_addr_ts_to_rs =
|
|
|
|
MALLOC(int32_t, num_ctbs);
|
|
|
|
encoder->tiles_tile_id = tiles_tile_id =
|
|
|
|
MALLOC(int32_t, num_ctbs);
|
|
|
|
|
|
|
|
if (!tiles_col_width ||
|
|
|
|
!tiles_row_height ||
|
|
|
|
!tiles_row_bd ||
|
|
|
|
!tiles_col_bd ||
|
|
|
|
!tiles_ctb_addr_rs_to_ts ||
|
|
|
|
!tiles_ctb_addr_ts_to_rs ||
|
|
|
|
!tiles_tile_id) {
|
|
|
|
goto init_failed;
|
|
|
|
}
|
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//(6-3) and (6-4) in ITU-T Rec. H.265 (04/2013)
|
|
|
|
if (!encoder->cfg->tiles_width_split) {
|
|
|
|
for (i=0; i < encoder->tiles_num_tile_columns; ++i) {
|
|
|
|
tiles_col_width[i] = ((i+1) * encoder->in.width_in_lcu) / encoder->tiles_num_tile_columns -
|
|
|
|
i * encoder->in.width_in_lcu / encoder->tiles_num_tile_columns;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
int32_t last_pos_in_px = 0;
|
|
|
|
tiles_col_width[encoder->tiles_num_tile_columns-1] = encoder->in.width_in_lcu;
|
|
|
|
for (i=0; i < encoder->tiles_num_tile_columns - 1; ++i) {
|
|
|
|
int32_t column_width_in_lcu = (cfg->tiles_width_split[i] - last_pos_in_px) / LCU_WIDTH;
|
|
|
|
last_pos_in_px = cfg->tiles_width_split[i];
|
|
|
|
tiles_col_width[i] = column_width_in_lcu;
|
|
|
|
tiles_col_width[encoder->tiles_num_tile_columns - 1] -= column_width_in_lcu;
|
|
|
|
}
|
|
|
|
encoder->tiles_uniform_spacing_flag = 0;
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
if (!encoder->cfg->tiles_height_split) {
|
|
|
|
for (i=0; i < encoder->tiles_num_tile_rows; ++i) {
|
|
|
|
tiles_row_height[i] = ((i+1) * encoder->in.height_in_lcu) / encoder->tiles_num_tile_rows -
|
|
|
|
i * encoder->in.height_in_lcu / encoder->tiles_num_tile_rows;
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
int32_t last_pos_in_px = 0;
|
|
|
|
tiles_row_height[encoder->tiles_num_tile_rows-1] = encoder->in.height_in_lcu;
|
|
|
|
for (i=0; i < encoder->tiles_num_tile_rows - 1; ++i) {
|
|
|
|
int32_t row_height_in_lcu = (cfg->tiles_height_split[i] - last_pos_in_px) / LCU_WIDTH;
|
|
|
|
last_pos_in_px = cfg->tiles_height_split[i];
|
|
|
|
tiles_row_height[i] = row_height_in_lcu;
|
|
|
|
tiles_row_height[encoder->tiles_num_tile_rows - 1] -= row_height_in_lcu;
|
|
|
|
}
|
|
|
|
encoder->tiles_uniform_spacing_flag = 0;
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//(6-5) in ITU-T Rec. H.265 (04/2013)
|
|
|
|
tiles_col_bd[0] = 0;
|
|
|
|
for (i = 0; i < encoder->tiles_num_tile_columns; ++i) {
|
|
|
|
tiles_col_bd[i+1] = tiles_col_bd[i] + tiles_col_width[i];
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//(6-6) in ITU-T Rec. H.265 (04/2013)
|
|
|
|
tiles_row_bd[0] = 0;
|
|
|
|
for (i = 0; i < encoder->tiles_num_tile_rows; ++i) {
|
|
|
|
tiles_row_bd[i+1] = tiles_row_bd[i] + tiles_row_height[i];
|
|
|
|
}
|
|
|
|
|
|
|
|
//(6-7) in ITU-T Rec. H.265 (04/2013)
|
|
|
|
//j == ctbAddrRs
|
|
|
|
for (j = 0; j < num_ctbs; ++j) {
|
2014-04-24 06:41:05 +00:00
|
|
|
int tileX = 0, tileY = 0;
|
2014-04-02 09:31:12 +00:00
|
|
|
int tbX = j % encoder->in.width_in_lcu;
|
|
|
|
int tbY = j / encoder->in.width_in_lcu;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
for (i = 0; i < encoder->tiles_num_tile_columns; ++i) {
|
|
|
|
if (tbX >= tiles_col_bd[i]) tileX = i;
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
for (i = 0; i < encoder->tiles_num_tile_rows; ++i) {
|
|
|
|
if (tbY >= tiles_row_bd[i]) tileY = i;
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
tiles_ctb_addr_rs_to_ts[j] = 0;
|
|
|
|
for (i = 0; i < tileX; ++i) {
|
|
|
|
tiles_ctb_addr_rs_to_ts[j] += tiles_row_height[tileY] * tiles_col_width[i];
|
|
|
|
}
|
|
|
|
for (i = 0; i < tileY; ++i) {
|
|
|
|
tiles_ctb_addr_rs_to_ts[j] += encoder->in.width_in_lcu * tiles_row_height[i];
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
tiles_ctb_addr_rs_to_ts[j] += (tbY - tiles_row_bd[tileY]) * tiles_col_width[tileX] +
|
2014-04-02 09:31:12 +00:00
|
|
|
tbX - tiles_col_bd[tileX];
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//(6-8) in ITU-T Rec. H.265 (04/2013)
|
|
|
|
//Make reverse map from tile scan to raster scan
|
|
|
|
for (j = 0; j < num_ctbs; ++j) {
|
|
|
|
tiles_ctb_addr_ts_to_rs[tiles_ctb_addr_rs_to_ts[j]] = j;
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//(6-9) in ITU-T Rec. H.265 (04/2013)
|
|
|
|
tileIdx = 0;
|
|
|
|
for (j=0; j < encoder->tiles_num_tile_rows; ++j) {
|
|
|
|
for (i=0; i < encoder->tiles_num_tile_columns; ++i) {
|
|
|
|
for (y = tiles_row_bd[j]; y < tiles_row_bd[j+1]; ++y) {
|
|
|
|
for (x = tiles_col_bd[i]; x < tiles_col_bd[i+1]; ++x) {
|
|
|
|
tiles_tile_id[tiles_ctb_addr_rs_to_ts[y * encoder->in.width_in_lcu + x]] = tileIdx;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
++tileIdx;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2014-05-05 13:17:22 +00:00
|
|
|
//Slices
|
|
|
|
{
|
|
|
|
int *slice_addresses_in_ts;
|
|
|
|
encoder->slice_count = encoder->cfg->slice_count;
|
|
|
|
if (encoder->slice_count == 0) {
|
|
|
|
encoder->slice_count = 1;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
|
|
|
encoder->slice_addresses_in_ts = slice_addresses_in_ts =
|
|
|
|
MALLOC(int, encoder->slice_count);
|
|
|
|
if (!slice_addresses_in_ts) goto init_failed;
|
|
|
|
|
2014-05-05 13:17:22 +00:00
|
|
|
slice_addresses_in_ts[0] = 0;
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-05-05 13:17:22 +00:00
|
|
|
} else {
|
2015-06-30 06:14:31 +00:00
|
|
|
encoder->slice_addresses_in_ts = slice_addresses_in_ts =
|
|
|
|
MALLOC(int, encoder->slice_count);
|
|
|
|
if (!slice_addresses_in_ts) goto init_failed;
|
|
|
|
|
2014-05-05 13:17:22 +00:00
|
|
|
if (!encoder->cfg->slice_addresses_in_ts) {
|
|
|
|
slice_addresses_in_ts[0] = 0;
|
2015-06-30 06:14:31 +00:00
|
|
|
for (int i=1; i < encoder->slice_count; ++i) {
|
2014-05-05 13:17:22 +00:00
|
|
|
slice_addresses_in_ts[i] = encoder->in.width_in_lcu * encoder->in.height_in_lcu * i / encoder->slice_count;
|
|
|
|
}
|
|
|
|
} else {
|
2015-06-30 06:14:31 +00:00
|
|
|
for (int i=0; i < encoder->slice_count; ++i) {
|
2014-05-05 13:17:22 +00:00
|
|
|
slice_addresses_in_ts[i] = encoder->cfg->slice_addresses_in_ts[i];
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-05-05 13:17:22 +00:00
|
|
|
encoder->wpp = encoder->cfg->wpp;
|
2014-04-02 09:31:12 +00:00
|
|
|
|
2014-04-22 12:49:39 +00:00
|
|
|
#ifdef _DEBUG
|
|
|
|
printf("Tiles columns width:");
|
|
|
|
for (i=0; i < encoder->tiles_num_tile_columns; ++i) {
|
|
|
|
printf(" %d", encoder->tiles_col_width[i]);
|
|
|
|
}
|
|
|
|
printf("\n");
|
|
|
|
printf("Tiles row height:");
|
|
|
|
for (i=0; i < encoder->tiles_num_tile_rows; ++i) {
|
|
|
|
printf(" %d", encoder->tiles_row_height[i]);
|
|
|
|
}
|
|
|
|
printf("\n");
|
|
|
|
//Print tile index map
|
|
|
|
for (y = 0; y < encoder->in.height_in_lcu; ++y) {
|
|
|
|
for (x = 0; x < encoder->in.width_in_lcu; ++x) {
|
2014-05-05 13:17:22 +00:00
|
|
|
const int lcu_id_rs = y * encoder->in.width_in_lcu + x;
|
|
|
|
const int lcu_id_ts = encoder->tiles_ctb_addr_rs_to_ts[lcu_id_rs];
|
|
|
|
const char slice_start = lcu_at_slice_start(encoder, lcu_id_ts) ? '|' : ' ';
|
|
|
|
const char slice_end = lcu_at_slice_end(encoder, lcu_id_ts) ? '|' : ' ';
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-05-05 13:17:22 +00:00
|
|
|
printf("%c%03d%c", slice_start, encoder->tiles_tile_id[lcu_id_ts], slice_end);
|
2014-04-22 12:49:39 +00:00
|
|
|
}
|
|
|
|
printf("\n");
|
|
|
|
}
|
2014-05-05 13:17:22 +00:00
|
|
|
printf("\n");
|
|
|
|
if (encoder->wpp) {
|
|
|
|
printf("Wavefront Parallel Processing: enabled\n");
|
|
|
|
} else {
|
|
|
|
printf("Wavefront Parallel Processing: disabled\n");
|
|
|
|
}
|
|
|
|
printf("\n");
|
2014-04-22 12:49:39 +00:00
|
|
|
#endif //_DEBUG
|
2014-04-02 09:31:12 +00:00
|
|
|
}
|
2015-05-15 11:04:56 +00:00
|
|
|
|
2015-01-09 10:04:23 +00:00
|
|
|
assert(WITHIN(cfg->pu_depth_inter.min, PU_DEPTH_INTER_MIN, PU_DEPTH_INTER_MAX));
|
|
|
|
assert(WITHIN(cfg->pu_depth_inter.max, PU_DEPTH_INTER_MIN, PU_DEPTH_INTER_MAX));
|
2015-04-02 07:31:56 +00:00
|
|
|
assert(WITHIN(cfg->pu_depth_intra.min, PU_DEPTH_INTRA_MIN, PU_DEPTH_INTRA_MAX));
|
|
|
|
assert(WITHIN(cfg->pu_depth_intra.max, PU_DEPTH_INTRA_MIN, PU_DEPTH_INTRA_MAX));
|
2015-01-09 10:04:23 +00:00
|
|
|
encoder->pu_depth_inter.min = cfg->pu_depth_inter.min;
|
|
|
|
encoder->pu_depth_inter.max = cfg->pu_depth_inter.max;
|
|
|
|
encoder->pu_depth_intra.min = cfg->pu_depth_intra.min;
|
|
|
|
encoder->pu_depth_intra.max = cfg->pu_depth_intra.max;
|
|
|
|
|
2015-08-11 05:42:09 +00:00
|
|
|
// input init (TODO: read from commandline / config)
|
2015-05-15 11:04:56 +00:00
|
|
|
encoder->in.video_format = FORMAT_420;
|
|
|
|
|
|
|
|
// deblocking filter
|
|
|
|
encoder->deblock_enable = (int8_t)encoder->cfg->deblock_enable;
|
|
|
|
encoder->beta_offset_div2 = (int8_t)encoder->cfg->deblock_beta;
|
|
|
|
encoder->tc_offset_div2 = (int8_t)encoder->cfg->deblock_tc;
|
|
|
|
// SAO
|
|
|
|
encoder->sao_enable = (int8_t)encoder->cfg->sao_enable;
|
|
|
|
// RDO
|
|
|
|
encoder->rdoq_enable = (int8_t)encoder->cfg->rdoq_enable;
|
|
|
|
encoder->rdo = (int8_t)encoder->cfg->rdo;
|
|
|
|
encoder->sign_hiding = encoder->cfg->signhide_enable;
|
|
|
|
encoder->full_intra_search = (int8_t)encoder->cfg->full_intra_search;
|
|
|
|
// TR SKIP
|
|
|
|
encoder->trskip_enable = (int8_t)encoder->cfg->trskip_enable;
|
|
|
|
encoder->tr_depth_intra = (int8_t)encoder->cfg->tr_depth_intra;
|
|
|
|
// MOTION ESTIMATION
|
|
|
|
encoder->fme_level = (int8_t)encoder->cfg->fme_level;
|
|
|
|
// VUI
|
|
|
|
encoder->vui.sar_width = (int16_t)encoder->cfg->vui.sar_width;
|
|
|
|
encoder->vui.sar_height = (int16_t)encoder->cfg->vui.sar_height;
|
|
|
|
encoder->vui.overscan = encoder->cfg->vui.overscan;
|
|
|
|
encoder->vui.videoformat = encoder->cfg->vui.videoformat;
|
|
|
|
encoder->vui.fullrange = encoder->cfg->vui.fullrange;
|
|
|
|
encoder->vui.colorprim = encoder->cfg->vui.colorprim;
|
|
|
|
encoder->vui.transfer = encoder->cfg->vui.transfer;
|
|
|
|
encoder->vui.colormatrix = encoder->cfg->vui.colormatrix;
|
|
|
|
encoder->vui.chroma_loc = (int8_t)encoder->cfg->vui.chroma_loc;
|
|
|
|
// AUD
|
|
|
|
encoder->aud_enable = (int8_t)encoder->cfg->aud_enable;
|
|
|
|
|
|
|
|
encoder->vps_period = encoder->cfg->vps_period * encoder->cfg->intra_period;
|
|
|
|
|
2015-06-30 06:14:31 +00:00
|
|
|
return encoder;
|
|
|
|
|
|
|
|
init_failed:
|
|
|
|
encoder_control_free(encoder);
|
|
|
|
return NULL;
|
2014-04-17 12:42:20 +00:00
|
|
|
}
|
2014-01-31 18:34:50 +00:00
|
|
|
|
2015-06-30 06:14:31 +00:00
|
|
|
/**
|
|
|
|
* \brief Free an encoder control structure.
|
|
|
|
*/
|
|
|
|
void encoder_control_free(encoder_control_t *const encoder) {
|
|
|
|
if (!encoder) return;
|
|
|
|
|
2014-05-05 13:17:22 +00:00
|
|
|
//Slices
|
|
|
|
FREE_POINTER(encoder->slice_addresses_in_ts);
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-02 09:31:12 +00:00
|
|
|
//Tiles
|
2014-05-01 12:10:22 +00:00
|
|
|
FREE_POINTER(encoder->tiles_col_width);
|
|
|
|
FREE_POINTER(encoder->tiles_row_height);
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-05-01 12:10:22 +00:00
|
|
|
FREE_POINTER(encoder->tiles_col_bd);
|
|
|
|
FREE_POINTER(encoder->tiles_row_bd);
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-05-01 12:10:22 +00:00
|
|
|
FREE_POINTER(encoder->tiles_ctb_addr_rs_to_ts);
|
|
|
|
FREE_POINTER(encoder->tiles_ctb_addr_ts_to_rs);
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-05-01 12:10:22 +00:00
|
|
|
FREE_POINTER(encoder->tiles_tile_id);
|
2015-06-30 06:14:31 +00:00
|
|
|
|
2014-04-17 12:42:20 +00:00
|
|
|
scalinglist_destroy(&encoder->scaling_list);
|
2015-06-30 06:14:31 +00:00
|
|
|
|
|
|
|
if (encoder->threadqueue) {
|
|
|
|
threadqueue_finalize(encoder->threadqueue);
|
2014-05-13 09:28:15 +00:00
|
|
|
}
|
|
|
|
FREE_POINTER(encoder->threadqueue);
|
|
|
|
|
2015-06-30 06:14:31 +00:00
|
|
|
free(encoder);
|
2014-04-17 12:42:20 +00:00
|
|
|
}
|
2014-01-31 18:34:50 +00:00
|
|
|
|
2015-03-04 10:26:57 +00:00
|
|
|
void encoder_control_input_init(encoder_control_t * const encoder,
|
2014-05-07 07:56:16 +00:00
|
|
|
const int32_t width, const int32_t height)
|
|
|
|
{
|
|
|
|
encoder->in.width = width;
|
|
|
|
encoder->in.height = height;
|
|
|
|
encoder->in.real_width = width;
|
|
|
|
encoder->in.real_height = height;
|
2014-06-05 12:54:58 +00:00
|
|
|
encoder->in.bitdepth = encoder->bitdepth;
|
2014-05-07 07:56:16 +00:00
|
|
|
|
|
|
|
// If input dimensions are not divisible by the smallest block size, add
|
|
|
|
// pixels to the dimensions, so that they are. These extra pixels will be
|
|
|
|
// compressed along with the real ones but they will be cropped out before
|
|
|
|
// rendering.
|
|
|
|
if (encoder->in.width % CU_MIN_SIZE_PIXELS) {
|
|
|
|
encoder->in.width += CU_MIN_SIZE_PIXELS - (width % CU_MIN_SIZE_PIXELS);
|
|
|
|
}
|
|
|
|
|
|
|
|
if (encoder->in.height % CU_MIN_SIZE_PIXELS) {
|
|
|
|
encoder->in.height += CU_MIN_SIZE_PIXELS - (height % CU_MIN_SIZE_PIXELS);
|
|
|
|
}
|
|
|
|
|
|
|
|
encoder->in.height_in_lcu = encoder->in.height / LCU_WIDTH;
|
|
|
|
encoder->in.width_in_lcu = encoder->in.width / LCU_WIDTH;
|
|
|
|
|
|
|
|
// Add one extra LCU when image not divisible by LCU_WIDTH
|
|
|
|
if (encoder->in.height_in_lcu * LCU_WIDTH < height) {
|
|
|
|
encoder->in.height_in_lcu++;
|
|
|
|
}
|
|
|
|
|
|
|
|
if (encoder->in.width_in_lcu * LCU_WIDTH < width) {
|
|
|
|
encoder->in.width_in_lcu++;
|
|
|
|
}
|
|
|
|
|
2015-05-27 12:41:45 +00:00
|
|
|
encoder->in.pixels_per_pic = encoder->in.width * encoder->in.height;
|
2014-05-07 07:56:16 +00:00
|
|
|
|
|
|
|
|
|
|
|
#ifdef _DEBUG
|
|
|
|
if (width != encoder->in.width || height != encoder->in.height) {
|
|
|
|
printf("Picture buffer has been extended to be a multiple of the smallest block size:\r\n");
|
|
|
|
printf(" Width = %d (%d), Height = %d (%d)\r\n", width, encoder->in.width, height,
|
|
|
|
encoder->in.height);
|
|
|
|
}
|
|
|
|
#endif
|
|
|
|
}
|
|
|
|
|
2015-05-27 12:41:45 +00:00
|
|
|
/**
|
|
|
|
* \brief Initialize GOP layer weights.
|
|
|
|
* \return 1 on success, 0 on failure.
|
|
|
|
*
|
|
|
|
* Selects appropriate weights for layers according to the target bpp.
|
|
|
|
* Only GOP structures with exactly four layers are supported.
|
|
|
|
*/
|
|
|
|
static int encoder_control_init_gop_layer_weights(encoder_control_t * const encoder)
|
|
|
|
{
|
|
|
|
|
2015-06-30 08:03:26 +00:00
|
|
|
kvz_gop_config const * const gop = encoder->cfg->gop;
|
2015-05-27 12:41:45 +00:00
|
|
|
const int8_t gop_len = encoder->cfg->gop_len;
|
|
|
|
|
|
|
|
int num_layers = 0;
|
|
|
|
for (int i = 0; i < gop_len; ++i) {
|
|
|
|
num_layers = MAX(gop[i].layer, num_layers);
|
|
|
|
}
|
|
|
|
|
|
|
|
switch (num_layers) {
|
|
|
|
case 0:
|
|
|
|
break;
|
|
|
|
|
|
|
|
case 4:
|
|
|
|
// These weights were copied from http://doi.org/10.1109/TIP.2014.2336550
|
|
|
|
if (encoder->target_avg_bpp <= 0.05) {
|
|
|
|
encoder->gop_layer_weights[0] = 30;
|
|
|
|
encoder->gop_layer_weights[1] = 8;
|
|
|
|
encoder->gop_layer_weights[2] = 4;
|
|
|
|
encoder->gop_layer_weights[3] = 1;
|
|
|
|
} else if (encoder->target_avg_bpp <= 0.1) {
|
|
|
|
encoder->gop_layer_weights[0] = 25;
|
|
|
|
encoder->gop_layer_weights[1] = 7;
|
|
|
|
encoder->gop_layer_weights[2] = 4;
|
|
|
|
encoder->gop_layer_weights[3] = 1;
|
|
|
|
} else if (encoder->target_avg_bpp <= 0.2) {
|
|
|
|
encoder->gop_layer_weights[0] = 20;
|
|
|
|
encoder->gop_layer_weights[1] = 6;
|
|
|
|
encoder->gop_layer_weights[2] = 4;
|
|
|
|
encoder->gop_layer_weights[3] = 1;
|
|
|
|
} else {
|
|
|
|
encoder->gop_layer_weights[0] = 15;
|
|
|
|
encoder->gop_layer_weights[1] = 5;
|
|
|
|
encoder->gop_layer_weights[2] = 4;
|
|
|
|
encoder->gop_layer_weights[3] = 1;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
|
|
|
|
default:
|
|
|
|
fprintf(stderr, "Unsupported number of GOP layers (%d)\n", num_layers);
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
|
|
|
// Normalize weights so that the sum of weights in a GOP is one.
|
|
|
|
double sum_weights = 0;
|
|
|
|
for (int i = 0; i < gop_len; ++i) {
|
|
|
|
sum_weights += encoder->gop_layer_weights[gop[i].layer - 1];
|
|
|
|
}
|
|
|
|
for (int i = 0; i < num_layers; ++i) {
|
|
|
|
encoder->gop_layer_weights[i] /= sum_weights;
|
|
|
|
}
|
|
|
|
|
|
|
|
return 1;
|
|
|
|
}
|