mirror of
https://github.com/ultravideo/uvg266.git
synced 2024-11-30 20:54:07 +00:00
402 lines
13 KiB
C
402 lines
13 KiB
C
/*****************************************************************************
|
|
* This file is part of Kvazaar HEVC encoder.
|
|
*
|
|
* Copyright (C) 2013-2015 Tampere University of Technology and others (see
|
|
* COPYING file).
|
|
*
|
|
* Kvazaar is free software: you can redistribute it and/or modify it under
|
|
* the terms of the GNU Lesser General Public License as published by the
|
|
* Free Software Foundation; either version 2.1 of the License, or (at your
|
|
* option) any later version.
|
|
*
|
|
* Kvazaar is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
* FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for
|
|
* more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License along
|
|
* with Kvazaar. If not, see <http://www.gnu.org/licenses/>.
|
|
****************************************************************************/
|
|
|
|
#include "kvazaar.h"
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <string.h>
|
|
|
|
#include "bitstream.h"
|
|
#include "cfg.h"
|
|
#include "checkpoint.h"
|
|
#include "encoder.h"
|
|
#include "encoder_state-bitstream.h"
|
|
#include "encoder_state-ctors_dtors.h"
|
|
#include "encoderstate.h"
|
|
#include "global.h"
|
|
#include "image.h"
|
|
#include "input_frame_buffer.h"
|
|
#include "kvazaar_internal.h"
|
|
#include "strategyselector.h"
|
|
#include "threadqueue.h"
|
|
#include "videoframe.h"
|
|
|
|
|
|
static void kvazaar_close(kvz_encoder *encoder)
|
|
{
|
|
if (encoder) {
|
|
// The threadqueue must be stopped before freeing states.
|
|
if (encoder->control) {
|
|
kvz_threadqueue_stop(encoder->control->threadqueue);
|
|
}
|
|
|
|
if (encoder->states) {
|
|
// Flush input frame buffer.
|
|
kvz_picture *pic = NULL;
|
|
while ((pic = kvz_encoder_feed_frame(&encoder->input_buffer,
|
|
&encoder->states[0],
|
|
NULL)) != NULL) {
|
|
kvz_image_free(pic);
|
|
pic = NULL;
|
|
}
|
|
|
|
for (unsigned i = 0; i < encoder->num_encoder_states; ++i) {
|
|
kvz_encoder_state_finalize(&encoder->states[i]);
|
|
}
|
|
}
|
|
FREE_POINTER(encoder->states);
|
|
|
|
// Discard const from the pointer.
|
|
kvz_encoder_control_free((void*) encoder->control);
|
|
encoder->control = NULL;
|
|
}
|
|
FREE_POINTER(encoder);
|
|
}
|
|
|
|
|
|
static kvz_encoder * kvazaar_open(const kvz_config *cfg)
|
|
{
|
|
kvz_encoder *encoder = NULL;
|
|
|
|
//Initialize strategies
|
|
// TODO: Make strategies non-global
|
|
if (!kvz_strategyselector_init(cfg->cpuid, KVZ_BIT_DEPTH)) {
|
|
fprintf(stderr, "Failed to initialize strategies.\n");
|
|
goto kvazaar_open_failure;
|
|
}
|
|
|
|
encoder = calloc(1, sizeof(kvz_encoder));
|
|
if (!encoder) {
|
|
goto kvazaar_open_failure;
|
|
}
|
|
|
|
encoder->control = kvz_encoder_control_init(cfg);
|
|
if (!encoder->control) {
|
|
goto kvazaar_open_failure;
|
|
}
|
|
|
|
encoder->num_encoder_states = encoder->control->cfg.owf + 1;
|
|
encoder->cur_state_num = 0;
|
|
encoder->out_state_num = 0;
|
|
encoder->frames_started = 0;
|
|
encoder->frames_done = 0;
|
|
|
|
kvz_init_input_frame_buffer(&encoder->input_buffer);
|
|
|
|
encoder->states = calloc(encoder->num_encoder_states, sizeof(encoder_state_t));
|
|
if (!encoder->states) {
|
|
goto kvazaar_open_failure;
|
|
}
|
|
|
|
for (unsigned i = 0; i < encoder->num_encoder_states; ++i) {
|
|
encoder->states[i].encoder_control = encoder->control;
|
|
|
|
if (!kvz_encoder_state_init(&encoder->states[i], NULL)) {
|
|
goto kvazaar_open_failure;
|
|
}
|
|
|
|
encoder->states[i].frame->QP = (int8_t)cfg->qp;
|
|
}
|
|
|
|
for (int i = 0; i < encoder->num_encoder_states; ++i) {
|
|
if (i == 0) {
|
|
encoder->states[i].previous_encoder_state = &encoder->states[encoder->num_encoder_states - 1];
|
|
} else {
|
|
encoder->states[i].previous_encoder_state = &encoder->states[(i - 1) % encoder->num_encoder_states];
|
|
}
|
|
kvz_encoder_state_match_children_of_previous_frame(&encoder->states[i]);
|
|
}
|
|
|
|
encoder->states[encoder->cur_state_num].frame->num = -1;
|
|
|
|
return encoder;
|
|
|
|
kvazaar_open_failure:
|
|
kvazaar_close(encoder);
|
|
return NULL;
|
|
}
|
|
|
|
|
|
static void set_frame_info(kvz_frame_info *const info, const encoder_state_t *const state)
|
|
{
|
|
info->poc = state->frame->poc,
|
|
info->qp = state->frame->QP;
|
|
info->nal_unit_type = state->frame->pictype;
|
|
info->slice_type = state->frame->slicetype;
|
|
|
|
memset(info->ref_list[0], 0, 16 * sizeof(int));
|
|
memset(info->ref_list[1], 0, 16 * sizeof(int));
|
|
|
|
for (size_t i = 0; i < state->frame->ref_LX_size[0]; i++) {
|
|
info->ref_list[0][i] = state->frame->ref->pocs[state->frame->ref_LX[0][i]];
|
|
}
|
|
|
|
for (size_t i = 0; i < state->frame->ref_LX_size[1]; i++) {
|
|
info->ref_list[1][i] = state->frame->ref->pocs[state->frame->ref_LX[1][i]];
|
|
}
|
|
|
|
info->ref_list_len[0] = state->frame->ref_LX_size[0];
|
|
info->ref_list_len[1] = state->frame->ref_LX_size[1];
|
|
}
|
|
|
|
|
|
static int kvazaar_headers(kvz_encoder *enc,
|
|
kvz_data_chunk **data_out,
|
|
uint32_t *len_out)
|
|
{
|
|
if (data_out) *data_out = NULL;
|
|
if (len_out) *len_out = 0;
|
|
|
|
bitstream_t stream;
|
|
kvz_bitstream_init(&stream);
|
|
|
|
kvz_encoder_state_write_parameter_sets(&stream, &enc->states[enc->cur_state_num]);
|
|
|
|
// Get stream length before taking chunks since that clears the stream.
|
|
if (len_out) *len_out = kvz_bitstream_tell(&stream) / 8;
|
|
if (data_out) *data_out = kvz_bitstream_take_chunks(&stream);
|
|
|
|
kvz_bitstream_finalize(&stream);
|
|
return 1;
|
|
}
|
|
|
|
|
|
/**
|
|
* \brief Separate a single field from a frame.
|
|
*
|
|
* \param frame_in input frame to extract field from
|
|
* \param source_scan_type scan type of input material (0: progressive, 1:top field first, 2:bottom field first)
|
|
* \param field parity
|
|
* \param field_out
|
|
*
|
|
* \return 1 on success, 0 on failure
|
|
*/
|
|
static int yuv_io_extract_field(const kvz_picture *frame_in, unsigned source_scan_type, unsigned field_parity, kvz_picture *field_out)
|
|
{
|
|
if ((source_scan_type != 1) && (source_scan_type != 2)) return 0;
|
|
if ((field_parity != 0) && (field_parity != 1)) return 0;
|
|
|
|
unsigned offset = 0;
|
|
if (source_scan_type == 1) offset = field_parity ? 1 : 0;
|
|
else if (source_scan_type == 2) offset = field_parity ? 0 : 1;
|
|
|
|
//Luma
|
|
for (int i = 0; i < field_out->height; ++i){
|
|
kvz_pixel *row_in = frame_in->y + MIN(frame_in->height - 1, 2 * i + offset) * frame_in->stride;
|
|
kvz_pixel *row_out = field_out->y + i * field_out->stride;
|
|
memcpy(row_out, row_in, sizeof(kvz_pixel) * frame_in->width);
|
|
}
|
|
|
|
//Chroma
|
|
for (int i = 0; i < field_out->height / 2; ++i){
|
|
kvz_pixel *row_in = frame_in->u + MIN(frame_in->height / 2 - 1, 2 * i + offset) * frame_in->stride / 2;
|
|
kvz_pixel *row_out = field_out->u + i * field_out->stride / 2;
|
|
memcpy(row_out, row_in, sizeof(kvz_pixel) * frame_in->width / 2);
|
|
}
|
|
|
|
for (int i = 0; i < field_out->height / 2; ++i){
|
|
kvz_pixel *row_in = frame_in->v + MIN(frame_in->height / 2 - 1, 2 * i + offset) * frame_in->stride / 2;
|
|
kvz_pixel *row_out = field_out->v + i * field_out->stride / 2;
|
|
memcpy(row_out, row_in, sizeof(kvz_pixel) * frame_in->width / 2);
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
|
|
static int kvazaar_encode(kvz_encoder *enc,
|
|
kvz_picture *pic_in,
|
|
kvz_data_chunk **data_out,
|
|
uint32_t *len_out,
|
|
kvz_picture **pic_out,
|
|
kvz_picture **src_out,
|
|
kvz_frame_info *info_out)
|
|
{
|
|
if (data_out) *data_out = NULL;
|
|
if (len_out) *len_out = 0;
|
|
if (pic_out) *pic_out = NULL;
|
|
if (src_out) *src_out = NULL;
|
|
|
|
encoder_state_t *state = &enc->states[enc->cur_state_num];
|
|
|
|
if (!state->frame->prepared) {
|
|
kvz_encoder_prepare(state);
|
|
}
|
|
|
|
if (pic_in != NULL) {
|
|
// FIXME: The frame number printed here is wrong when GOP is enabled.
|
|
CHECKPOINT_MARK("read source frame: %d", state->frame->num + enc->control->cfg.seek);
|
|
}
|
|
|
|
kvz_picture* frame = kvz_encoder_feed_frame(&enc->input_buffer, state, pic_in);
|
|
if (frame) {
|
|
assert(state->frame->num == enc->frames_started);
|
|
// Start encoding.
|
|
kvz_encode_one_frame(state, frame);
|
|
enc->frames_started += 1;
|
|
}
|
|
|
|
// If we have finished encoding as many frames as we have started, we are done.
|
|
if (enc->frames_done == enc->frames_started) {
|
|
return 1;
|
|
}
|
|
|
|
if (!state->frame->done) {
|
|
// We started encoding a frame; move to the next encoder state.
|
|
enc->cur_state_num = (enc->cur_state_num + 1) % (enc->num_encoder_states);
|
|
}
|
|
|
|
encoder_state_t *output_state = &enc->states[enc->out_state_num];
|
|
if (!output_state->frame->done &&
|
|
(pic_in == NULL || enc->cur_state_num == enc->out_state_num)) {
|
|
|
|
kvz_threadqueue_waitfor(enc->control->threadqueue, output_state->tqj_bitstream_written);
|
|
// The job pointer must be set to NULL here since it won't be usable after
|
|
// the next frame is done.
|
|
kvz_threadqueue_free_job(&output_state->tqj_bitstream_written);
|
|
|
|
// Get stream length before taking chunks since that clears the stream.
|
|
if (len_out) *len_out = kvz_bitstream_tell(&output_state->stream) / 8;
|
|
if (data_out) *data_out = kvz_bitstream_take_chunks(&output_state->stream);
|
|
if (pic_out) *pic_out = kvz_image_copy_ref(output_state->tile->frame->rec);
|
|
if (src_out) *src_out = kvz_image_copy_ref(output_state->tile->frame->source);
|
|
if (info_out) set_frame_info(info_out, output_state);
|
|
|
|
output_state->frame->done = 1;
|
|
output_state->frame->prepared = 0;
|
|
enc->frames_done += 1;
|
|
|
|
enc->out_state_num = (enc->out_state_num + 1) % (enc->num_encoder_states);
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
|
|
static int kvazaar_field_encoding_adapter(kvz_encoder *enc,
|
|
kvz_picture *pic_in,
|
|
kvz_data_chunk **data_out,
|
|
uint32_t *len_out,
|
|
kvz_picture **pic_out,
|
|
kvz_picture **src_out,
|
|
kvz_frame_info *info_out)
|
|
{
|
|
if (enc->control->cfg.source_scan_type == KVZ_INTERLACING_NONE) {
|
|
// For progressive, simply call the normal encoding function.
|
|
return kvazaar_encode(enc, pic_in, data_out, len_out, pic_out, src_out, info_out);
|
|
}
|
|
|
|
// For interlaced, make two fields out of the input frame and call encode on them separately.
|
|
encoder_state_t *state = &enc->states[enc->cur_state_num];
|
|
kvz_picture *first_field = NULL, *second_field = NULL;
|
|
struct {
|
|
kvz_data_chunk* data_out;
|
|
uint32_t len_out;
|
|
} first = { 0, 0 }, second = { 0, 0 };
|
|
|
|
if (pic_in != NULL) {
|
|
first_field = kvz_image_alloc(state->encoder_control->chroma_format, state->encoder_control->in.width, state->encoder_control->in.height);
|
|
if (first_field == NULL) {
|
|
goto kvazaar_field_encoding_adapter_failure;
|
|
}
|
|
second_field = kvz_image_alloc(state->encoder_control->chroma_format, state->encoder_control->in.width, state->encoder_control->in.height);
|
|
if (second_field == NULL) {
|
|
goto kvazaar_field_encoding_adapter_failure;
|
|
}
|
|
|
|
yuv_io_extract_field(pic_in, pic_in->interlacing, 0, first_field);
|
|
yuv_io_extract_field(pic_in, pic_in->interlacing, 1, second_field);
|
|
|
|
first_field->pts = pic_in->pts;
|
|
first_field->dts = pic_in->dts;
|
|
first_field->interlacing = pic_in->interlacing;
|
|
|
|
// Should the second field have higher pts and dts? It shouldn't affect anything.
|
|
second_field->pts = pic_in->pts;
|
|
second_field->dts = pic_in->dts;
|
|
second_field->interlacing = pic_in->interlacing;
|
|
}
|
|
|
|
if (!kvazaar_encode(enc, first_field, &first.data_out, &first.len_out, pic_out, NULL, info_out)) {
|
|
goto kvazaar_field_encoding_adapter_failure;
|
|
}
|
|
if (!kvazaar_encode(enc, second_field, &second.data_out, &second.len_out, NULL, NULL, NULL)) {
|
|
goto kvazaar_field_encoding_adapter_failure;
|
|
}
|
|
|
|
kvz_image_free(first_field);
|
|
kvz_image_free(second_field);
|
|
|
|
// Concatenate bitstreams.
|
|
if (len_out != NULL) {
|
|
*len_out = first.len_out + second.len_out;
|
|
}
|
|
if (data_out != NULL) {
|
|
*data_out = first.data_out;
|
|
if (first.data_out != NULL) {
|
|
kvz_data_chunk *chunk = first.data_out;
|
|
while (chunk->next != NULL) {
|
|
chunk = chunk->next;
|
|
}
|
|
chunk->next = second.data_out;
|
|
}
|
|
}
|
|
|
|
if (src_out != NULL) {
|
|
// TODO: deinterlace the fields to one picture.
|
|
}
|
|
|
|
return 1;
|
|
|
|
kvazaar_field_encoding_adapter_failure:
|
|
kvz_image_free(first_field);
|
|
kvz_image_free(second_field);
|
|
kvz_bitstream_free_chunks(first.data_out);
|
|
kvz_bitstream_free_chunks(second.data_out);
|
|
return 0;
|
|
}
|
|
|
|
|
|
static const kvz_api kvz_8bit_api = {
|
|
.config_alloc = kvz_config_alloc,
|
|
.config_init = kvz_config_init,
|
|
.config_destroy = kvz_config_destroy,
|
|
.config_parse = kvz_config_parse,
|
|
|
|
.picture_alloc = kvz_image_alloc_420,
|
|
.picture_free = kvz_image_free,
|
|
|
|
.chunk_free = kvz_bitstream_free_chunks,
|
|
|
|
.encoder_open = kvazaar_open,
|
|
.encoder_close = kvazaar_close,
|
|
.encoder_headers = kvazaar_headers,
|
|
.encoder_encode = kvazaar_field_encoding_adapter,
|
|
|
|
.picture_alloc_csp = kvz_image_alloc,
|
|
};
|
|
|
|
|
|
const kvz_api * kvz_api_get(int bit_depth)
|
|
{
|
|
return &kvz_8bit_api;
|
|
}
|