uvg266/src/kvazaar.c
Arttu Ylä-Outinen 2991962033 Add reference counting to threadequeue_job_t
Both the thread queue and the encoder states hold pointers to the thread
queue jobs. It is possible that a job is removed from the thread queue
and freed while the encoder state is still using it. This commit adds
reference counting to threadqueue_job_t in order to fix the problem.

Fixes #161.
2017-04-12 16:13:52 +03:00

375 lines
12 KiB
C

/*****************************************************************************
* This file is part of Kvazaar HEVC encoder.
*
* Copyright (C) 2013-2015 Tampere University of Technology and others (see
* COPYING file).
*
* Kvazaar is free software: you can redistribute it and/or modify it under
* the terms of the GNU Lesser General Public License as published by the
* Free Software Foundation; either version 2.1 of the License, or (at your
* option) any later version.
*
* Kvazaar is distributed in the hope that it will be useful, but WITHOUT ANY
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
* FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for
* more details.
*
* You should have received a copy of the GNU General Public License along
* with Kvazaar. If not, see <http://www.gnu.org/licenses/>.
****************************************************************************/
#include "kvazaar.h"
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "bitstream.h"
#include "cfg.h"
#include "checkpoint.h"
#include "encoder.h"
#include "encoder_state-bitstream.h"
#include "encoder_state-ctors_dtors.h"
#include "encoderstate.h"
#include "global.h"
#include "image.h"
#include "input_frame_buffer.h"
#include "kvazaar_internal.h"
#include "strategyselector.h"
#include "threadqueue.h"
#include "videoframe.h"
static void kvazaar_close(kvz_encoder *encoder)
{
if (encoder) {
if (encoder->states) {
for (unsigned i = 0; i < encoder->num_encoder_states; ++i) {
kvz_encoder_state_finalize(&encoder->states[i]);
}
}
FREE_POINTER(encoder->states);
// Discard const from the pointer.
kvz_encoder_control_free((void*) encoder->control);
encoder->control = NULL;
}
FREE_POINTER(encoder);
}
static kvz_encoder * kvazaar_open(const kvz_config *cfg)
{
kvz_encoder *encoder = NULL;
//Initialize strategies
// TODO: Make strategies non-global
if (!kvz_strategyselector_init(cfg->cpuid, KVZ_BIT_DEPTH)) {
fprintf(stderr, "Failed to initialize strategies.\n");
goto kvazaar_open_failure;
}
encoder = calloc(1, sizeof(kvz_encoder));
if (!encoder) {
goto kvazaar_open_failure;
}
encoder->control = kvz_encoder_control_init(cfg);
if (!encoder->control) {
goto kvazaar_open_failure;
}
encoder->num_encoder_states = encoder->control->cfg.owf + 1;
encoder->cur_state_num = 0;
encoder->out_state_num = 0;
encoder->frames_started = 0;
encoder->frames_done = 0;
kvz_init_input_frame_buffer(&encoder->input_buffer);
encoder->states = calloc(encoder->num_encoder_states, sizeof(encoder_state_t));
if (!encoder->states) {
goto kvazaar_open_failure;
}
for (unsigned i = 0; i < encoder->num_encoder_states; ++i) {
encoder->states[i].encoder_control = encoder->control;
if (!kvz_encoder_state_init(&encoder->states[i], NULL)) {
goto kvazaar_open_failure;
}
encoder->states[i].frame->QP = (int8_t)cfg->qp;
}
for (int i = 0; i < encoder->num_encoder_states; ++i) {
if (i == 0) {
encoder->states[i].previous_encoder_state = &encoder->states[encoder->num_encoder_states - 1];
} else {
encoder->states[i].previous_encoder_state = &encoder->states[(i - 1) % encoder->num_encoder_states];
}
kvz_encoder_state_match_children_of_previous_frame(&encoder->states[i]);
}
encoder->states[encoder->cur_state_num].frame->num = -1;
return encoder;
kvazaar_open_failure:
kvazaar_close(encoder);
return NULL;
}
static void set_frame_info(kvz_frame_info *const info, const encoder_state_t *const state)
{
info->poc = state->frame->poc,
info->qp = state->frame->QP;
info->nal_unit_type = state->frame->pictype;
info->slice_type = state->frame->slicetype;
kvz_encoder_get_ref_lists(state, info->ref_list_len, info->ref_list);
}
static int kvazaar_headers(kvz_encoder *enc,
kvz_data_chunk **data_out,
uint32_t *len_out)
{
if (data_out) *data_out = NULL;
if (len_out) *len_out = 0;
bitstream_t stream;
kvz_bitstream_init(&stream);
kvz_encoder_state_write_parameter_sets(&stream, &enc->states[enc->cur_state_num]);
// Get stream length before taking chunks since that clears the stream.
if (len_out) *len_out = kvz_bitstream_tell(&stream) / 8;
if (data_out) *data_out = kvz_bitstream_take_chunks(&stream);
kvz_bitstream_finalize(&stream);
return 1;
}
/**
* \brief Separate a single field from a frame.
*
* \param frame_in input frame to extract field from
* \param source_scan_type scan type of input material (0: progressive, 1:top field first, 2:bottom field first)
* \param field parity
* \param field_out
*
* \return 1 on success, 0 on failure
*/
static int yuv_io_extract_field(const kvz_picture *frame_in, unsigned source_scan_type, unsigned field_parity, kvz_picture *field_out)
{
if ((source_scan_type != 1) && (source_scan_type != 2)) return 0;
if ((field_parity != 0) && (field_parity != 1)) return 0;
unsigned offset = 0;
if (source_scan_type == 1) offset = field_parity ? 1 : 0;
else if (source_scan_type == 2) offset = field_parity ? 0 : 1;
//Luma
for (int i = 0; i < field_out->height; ++i){
kvz_pixel *row_in = frame_in->y + MIN(frame_in->height - 1, 2 * i + offset) * frame_in->stride;
kvz_pixel *row_out = field_out->y + i * field_out->stride;
memcpy(row_out, row_in, sizeof(kvz_pixel) * frame_in->width);
}
//Chroma
for (int i = 0; i < field_out->height / 2; ++i){
kvz_pixel *row_in = frame_in->u + MIN(frame_in->height / 2 - 1, 2 * i + offset) * frame_in->stride / 2;
kvz_pixel *row_out = field_out->u + i * field_out->stride / 2;
memcpy(row_out, row_in, sizeof(kvz_pixel) * frame_in->width / 2);
}
for (int i = 0; i < field_out->height / 2; ++i){
kvz_pixel *row_in = frame_in->v + MIN(frame_in->height / 2 - 1, 2 * i + offset) * frame_in->stride / 2;
kvz_pixel *row_out = field_out->v + i * field_out->stride / 2;
memcpy(row_out, row_in, sizeof(kvz_pixel) * frame_in->width / 2);
}
return 1;
}
static int kvazaar_encode(kvz_encoder *enc,
kvz_picture *pic_in,
kvz_data_chunk **data_out,
uint32_t *len_out,
kvz_picture **pic_out,
kvz_picture **src_out,
kvz_frame_info *info_out)
{
if (data_out) *data_out = NULL;
if (len_out) *len_out = 0;
if (pic_out) *pic_out = NULL;
if (src_out) *src_out = NULL;
encoder_state_t *state = &enc->states[enc->cur_state_num];
if (!state->frame->prepared) {
kvz_encoder_prepare(state);
}
if (pic_in != NULL) {
// FIXME: The frame number printed here is wrong when GOP is enabled.
CHECKPOINT_MARK("read source frame: %d", state->frame->num + enc->control->cfg.seek);
}
kvz_picture* frame = kvz_encoder_feed_frame(&enc->input_buffer, state, pic_in);
if (frame) {
assert(state->frame->num == enc->frames_started);
// Start encoding.
kvz_encode_one_frame(state, frame);
enc->frames_started += 1;
}
// If we have finished encoding as many frames as we have started, we are done.
if (enc->frames_done == enc->frames_started) {
return 1;
}
if (!state->frame->done) {
// We started encoding a frame; move to the next encoder state.
enc->cur_state_num = (enc->cur_state_num + 1) % (enc->num_encoder_states);
}
encoder_state_t *output_state = &enc->states[enc->out_state_num];
if (!output_state->frame->done &&
(pic_in == NULL || enc->cur_state_num == enc->out_state_num)) {
kvz_threadqueue_waitfor(enc->control->threadqueue, output_state->tqj_bitstream_written);
// The job pointer must be set to NULL here since it won't be usable after
// the next frame is done.
kvz_threadqueue_free_job(&output_state->tqj_bitstream_written);
// Get stream length before taking chunks since that clears the stream.
if (len_out) *len_out = kvz_bitstream_tell(&output_state->stream) / 8;
if (data_out) *data_out = kvz_bitstream_take_chunks(&output_state->stream);
if (pic_out) *pic_out = kvz_image_copy_ref(output_state->tile->frame->rec);
if (src_out) *src_out = kvz_image_copy_ref(output_state->tile->frame->source);
if (info_out) set_frame_info(info_out, output_state);
output_state->frame->done = 1;
output_state->frame->prepared = 0;
enc->frames_done += 1;
enc->out_state_num = (enc->out_state_num + 1) % (enc->num_encoder_states);
}
return 1;
}
static int kvazaar_field_encoding_adapter(kvz_encoder *enc,
kvz_picture *pic_in,
kvz_data_chunk **data_out,
uint32_t *len_out,
kvz_picture **pic_out,
kvz_picture **src_out,
kvz_frame_info *info_out)
{
if (enc->control->cfg.source_scan_type == KVZ_INTERLACING_NONE) {
// For progressive, simply call the normal encoding function.
return kvazaar_encode(enc, pic_in, data_out, len_out, pic_out, src_out, info_out);
}
// For interlaced, make two fields out of the input frame and call encode on them separately.
encoder_state_t *state = &enc->states[enc->cur_state_num];
kvz_picture *first_field = NULL, *second_field = NULL;
struct {
kvz_data_chunk* data_out;
uint32_t len_out;
} first = { 0, 0 }, second = { 0, 0 };
if (pic_in != NULL) {
first_field = kvz_image_alloc(state->encoder_control->chroma_format, state->encoder_control->in.width, state->encoder_control->in.height);
if (first_field == NULL) {
goto kvazaar_field_encoding_adapter_failure;
}
second_field = kvz_image_alloc(state->encoder_control->chroma_format, state->encoder_control->in.width, state->encoder_control->in.height);
if (second_field == NULL) {
goto kvazaar_field_encoding_adapter_failure;
}
yuv_io_extract_field(pic_in, pic_in->interlacing, 0, first_field);
yuv_io_extract_field(pic_in, pic_in->interlacing, 1, second_field);
first_field->pts = pic_in->pts;
first_field->dts = pic_in->dts;
first_field->interlacing = pic_in->interlacing;
// Should the second field have higher pts and dts? It shouldn't affect anything.
second_field->pts = pic_in->pts;
second_field->dts = pic_in->dts;
second_field->interlacing = pic_in->interlacing;
}
if (!kvazaar_encode(enc, first_field, &first.data_out, &first.len_out, pic_out, NULL, info_out)) {
goto kvazaar_field_encoding_adapter_failure;
}
if (!kvazaar_encode(enc, second_field, &second.data_out, &second.len_out, NULL, NULL, NULL)) {
goto kvazaar_field_encoding_adapter_failure;
}
kvz_image_free(first_field);
kvz_image_free(second_field);
// Concatenate bitstreams.
if (len_out != NULL) {
*len_out = first.len_out + second.len_out;
}
if (data_out != NULL) {
*data_out = first.data_out;
if (first.data_out != NULL) {
kvz_data_chunk *chunk = first.data_out;
while (chunk->next != NULL) {
chunk = chunk->next;
}
chunk->next = second.data_out;
}
}
if (src_out != NULL) {
// TODO: deinterlace the fields to one picture.
}
return 1;
kvazaar_field_encoding_adapter_failure:
kvz_image_free(first_field);
kvz_image_free(second_field);
kvz_bitstream_free_chunks(first.data_out);
kvz_bitstream_free_chunks(second.data_out);
return 0;
}
static const kvz_api kvz_8bit_api = {
.config_alloc = kvz_config_alloc,
.config_init = kvz_config_init,
.config_destroy = kvz_config_destroy,
.config_parse = kvz_config_parse,
.picture_alloc = kvz_image_alloc_420,
.picture_free = kvz_image_free,
.chunk_free = kvz_bitstream_free_chunks,
.encoder_open = kvazaar_open,
.encoder_close = kvazaar_close,
.encoder_headers = kvazaar_headers,
.encoder_encode = kvazaar_field_encoding_adapter,
.picture_alloc_csp = kvz_image_alloc,
};
const kvz_api * kvz_api_get(int bit_depth)
{
return &kvz_8bit_api;
}