2014-11-20 16:38:54 +00:00
|
|
|
#ifndef STRATEGIES_IPOL_H_
|
|
|
|
#define STRATEGIES_IPOL_H_
|
|
|
|
/*****************************************************************************
|
|
|
|
* This file is part of Kvazaar HEVC encoder.
|
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* Copyright (C) 2013-2015 Tampere University of Technology and others (see
|
2014-11-20 16:38:54 +00:00
|
|
|
* COPYING file).
|
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* Kvazaar is free software: you can redistribute it and/or modify it under
|
|
|
|
* the terms of the GNU Lesser General Public License as published by the
|
|
|
|
* Free Software Foundation; either version 2.1 of the License, or (at your
|
|
|
|
* option) any later version.
|
2014-11-20 16:38:54 +00:00
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* Kvazaar is distributed in the hope that it will be useful, but WITHOUT ANY
|
|
|
|
* WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
|
|
|
|
* FOR A PARTICULAR PURPOSE. See the GNU Lesser General Public License for
|
|
|
|
* more details.
|
2014-11-20 16:38:54 +00:00
|
|
|
*
|
2015-02-23 11:18:48 +00:00
|
|
|
* You should have received a copy of the GNU General Public License along
|
|
|
|
* with Kvazaar. If not, see <http://www.gnu.org/licenses/>.
|
2014-11-20 16:38:54 +00:00
|
|
|
****************************************************************************/
|
2015-12-17 11:42:57 +00:00
|
|
|
|
|
|
|
/**
|
|
|
|
* \ingroup Optimization
|
|
|
|
* \file
|
|
|
|
* Interface for subpixel interpolation functions.
|
|
|
|
*/
|
|
|
|
|
2016-04-01 14:14:23 +00:00
|
|
|
#include "encoder.h"
|
2016-03-30 09:41:37 +00:00
|
|
|
#include "global.h" // IWYU pragma: keep
|
2016-04-01 14:14:23 +00:00
|
|
|
#include "kvazaar.h"
|
2016-07-12 15:03:52 +00:00
|
|
|
#include "search_inter.h"
|
2016-01-22 13:07:49 +00:00
|
|
|
|
2021-03-06 23:27:55 +00:00
|
|
|
// AVX2 implementation of horizontal filter reads and
|
|
|
|
// writes two rows for luma and four for chroma at a time.
|
|
|
|
// Extra vertical padding is added to prevent segfaults.
|
|
|
|
// Horizontal padding is not needed even if one extra byte
|
|
|
|
// is read because kvz_image_alloc adds enough padding.
|
|
|
|
#define KVZ_IPOL_MAX_INPUT_SIZE_LUMA_SIMD ((KVZ_EXT_BLOCK_W_LUMA + 1) * KVZ_EXT_BLOCK_W_LUMA)
|
|
|
|
#define KVZ_IPOL_MAX_INPUT_SIZE_CHROMA_SIMD ((KVZ_EXT_BLOCK_W_CHROMA + 3) * KVZ_EXT_BLOCK_W_CHROMA)
|
|
|
|
#define KVZ_IPOL_MAX_IM_SIZE_LUMA_SIMD ((KVZ_EXT_BLOCK_W_LUMA + 1) * LCU_WIDTH)
|
|
|
|
#define KVZ_IPOL_MAX_IM_SIZE_CHROMA_SIMD ((KVZ_EXT_BLOCK_W_CHROMA + 3) * LCU_WIDTH_C)
|
|
|
|
|
|
|
|
// On top of basic interpolation, FME needs one extra
|
|
|
|
// column and row for ME (left and up). Adding the
|
|
|
|
// extra row happens to satisfy AVX2 requirements for
|
|
|
|
// row count. No other extra rows are needed.
|
|
|
|
#define KVZ_FME_MAX_INPUT_SIZE_SIMD ((KVZ_EXT_BLOCK_W_LUMA + 1) * (KVZ_EXT_BLOCK_W_LUMA + 1))
|
2014-11-20 16:38:54 +00:00
|
|
|
|
2015-08-17 08:12:49 +00:00
|
|
|
typedef struct { kvz_pixel *buffer; kvz_pixel *orig_topleft; unsigned stride; unsigned malloc_used; } kvz_extended_block;
|
2014-11-20 16:38:54 +00:00
|
|
|
|
2018-11-04 19:04:17 +00:00
|
|
|
typedef void(ipol_blocks_func)(const encoder_control_t * encoder, kvz_pixel *src, int16_t src_stride, int width, int height,
|
2021-03-06 23:27:55 +00:00
|
|
|
kvz_pixel filtered[4][LCU_LUMA_SIZE], int16_t hor_intermediate[5][KVZ_IPOL_MAX_IM_SIZE_LUMA_SIMD], int8_t fme_level, int16_t hor_first_cols[5][KVZ_EXT_BLOCK_W_LUMA + 1],
|
2018-11-04 19:04:17 +00:00
|
|
|
int8_t sample_off_x, int8_t sample_off_y);
|
2016-07-12 15:03:52 +00:00
|
|
|
|
2021-03-02 17:48:57 +00:00
|
|
|
typedef struct {
|
|
|
|
// Source samples
|
|
|
|
kvz_pixel *src; // Top-left sample
|
|
|
|
int src_w; // Width
|
|
|
|
int src_h; // Height
|
|
|
|
int src_s; // Stride
|
|
|
|
|
|
|
|
// Requested sampling position, base dimensions, and padding
|
|
|
|
int blk_x;
|
|
|
|
int blk_y;
|
|
|
|
int blk_w; // Width
|
|
|
|
int blk_h; // Height
|
|
|
|
int pad_l; // Left
|
|
|
|
int pad_r; // Right
|
|
|
|
int pad_t; // Top
|
|
|
|
int pad_b; // Bottom
|
2021-03-08 14:05:34 +00:00
|
|
|
int pad_b_simd; // "Don't care" rows in the end. Zeroed out.
|
2021-03-02 17:48:57 +00:00
|
|
|
|
|
|
|
// Buffer for possible extrapolation. Free memory provided by the caller.
|
|
|
|
kvz_pixel *buf;
|
|
|
|
|
|
|
|
// Extended block data. These are set by the function.
|
|
|
|
kvz_pixel **ext; // Top-left sample with padding
|
|
|
|
kvz_pixel **ext_origin; // Top-left sample without padding
|
|
|
|
int *ext_s; // Stride
|
|
|
|
} kvz_epol_args;
|
|
|
|
|
2021-03-05 16:14:27 +00:00
|
|
|
typedef void(epol_func)(kvz_epol_args *args);
|
2021-03-02 17:48:57 +00:00
|
|
|
|
2014-11-20 16:38:54 +00:00
|
|
|
|
2021-11-22 08:38:18 +00:00
|
|
|
typedef void(kvz_sample_quarterpel_luma_func)(const encoder_control_t * const encoder, kvz_pixel *src, int16_t src_stride, int width, int height, kvz_pixel *dst, int16_t dst_stride, int8_t hor_flag, int8_t ver_flag, const mv_t mv[2]);
|
|
|
|
typedef void(kvz_sample_octpel_chroma_func)(const encoder_control_t * const encoder, kvz_pixel *src, int16_t src_stride, int width, int height, kvz_pixel *dst, int16_t dst_stride, int8_t hor_flag, int8_t ver_flag, const mv_t mv[2]);
|
2016-04-06 16:55:42 +00:00
|
|
|
|
2021-11-22 08:38:18 +00:00
|
|
|
typedef void(kvz_sample_quarterpel_luma_hi_func)(const encoder_control_t * const encoder, kvz_pixel *src, int16_t src_stride, int width, int height, int16_t *dst, int16_t dst_stride, int8_t hor_flag, int8_t ver_flag, const mv_t mv[2]);
|
|
|
|
typedef void(kvz_sample_octpel_chroma_hi_func)(const encoder_control_t * const encoder, kvz_pixel *src, int16_t src_stride, int width, int height, int16_t *dst, int16_t dst_stride, int8_t hor_flag, int8_t ver_flag, const mv_t mv[2]);
|
2014-11-20 16:38:54 +00:00
|
|
|
|
|
|
|
// Declare function pointers.
|
2018-11-04 19:04:17 +00:00
|
|
|
extern ipol_blocks_func * kvz_filter_hpel_blocks_hor_ver_luma;
|
|
|
|
extern ipol_blocks_func * kvz_filter_hpel_blocks_diag_luma;
|
|
|
|
extern ipol_blocks_func * kvz_filter_qpel_blocks_hor_ver_luma;
|
|
|
|
extern ipol_blocks_func * kvz_filter_qpel_blocks_diag_luma;
|
2015-08-26 08:50:27 +00:00
|
|
|
extern epol_func * kvz_get_extended_block;
|
2016-04-06 16:55:42 +00:00
|
|
|
extern kvz_sample_quarterpel_luma_func * kvz_sample_quarterpel_luma;
|
|
|
|
extern kvz_sample_octpel_chroma_func * kvz_sample_octpel_chroma;
|
2021-03-06 17:46:36 +00:00
|
|
|
extern kvz_sample_quarterpel_luma_hi_func * kvz_sample_quarterpel_luma_hi;
|
|
|
|
extern kvz_sample_octpel_chroma_hi_func * kvz_sample_octpel_chroma_hi;
|
2014-11-20 16:38:54 +00:00
|
|
|
|
|
|
|
|
2015-08-26 08:50:27 +00:00
|
|
|
int kvz_strategy_register_ipol(void* opaque, uint8_t bitdepth);
|
2014-11-20 16:38:54 +00:00
|
|
|
|
|
|
|
|
|
|
|
#define STRATEGIES_IPOL_EXPORTS \
|
2018-11-04 19:04:17 +00:00
|
|
|
{"filter_hpel_blocks_hor_ver_luma", (void**) &kvz_filter_hpel_blocks_hor_ver_luma}, \
|
|
|
|
{"filter_hpel_blocks_diag_luma", (void**) &kvz_filter_hpel_blocks_diag_luma}, \
|
|
|
|
{"filter_qpel_blocks_hor_ver_luma", (void**) &kvz_filter_qpel_blocks_hor_ver_luma}, \
|
|
|
|
{"filter_qpel_blocks_diag_luma", (void**) &kvz_filter_qpel_blocks_diag_luma}, \
|
2016-04-06 16:55:42 +00:00
|
|
|
{"sample_quarterpel_luma", (void**) &kvz_sample_quarterpel_luma}, \
|
|
|
|
{"sample_octpel_chroma", (void**) &kvz_sample_octpel_chroma}, \
|
2021-03-06 17:46:36 +00:00
|
|
|
{"sample_quarterpel_luma_hi", (void**) &kvz_sample_quarterpel_luma_hi}, \
|
|
|
|
{"sample_octpel_chroma_hi", (void**) &kvz_sample_octpel_chroma_hi}, \
|
2015-08-26 08:50:27 +00:00
|
|
|
{"get_extended_block", (void**) &kvz_get_extended_block}, \
|
2014-11-20 16:38:54 +00:00
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
#endif //STRATEGIES_IPOL_H_
|