uvg266/src/picture.c

884 lines
26 KiB
C
Raw Normal View History

/**
2013-09-18 14:29:30 +00:00
* \file
*
* \author Marko Viitanen ( fador@iki.fi ),
* Tampere University of Technology,
* Department of Pervasive Computing.
* \author Ari Koivula ( ari@koivu.la ),
* Tampere University of Technology,
* Department of Pervasive Computing.
*/
#include "picture.h"
#include <string.h>
#include <stdio.h>
#include <stdlib.h>
2013-09-20 08:07:31 +00:00
#include <math.h>
#include "sao.h"
2013-09-20 08:07:31 +00:00
#define PSNRMAX (255.0 * 255.0)
2013-10-23 12:14:26 +00:00
/**
 * \brief Store the skipped flag for every smallest CU covered by a block.
 *
 * Only the MAX_DEPTH layer of pic->cu_array is written.
 *
 * \param pic      picture whose CU array is updated
 * \param x_scu    x position of the block's first SCU (smallest CU)
 * \param y_scu    y position of the block's first SCU (smallest CU)
 * \param depth    CU depth of the block; determines its width in SCUs
 * \param skipped  value written to the skipped field
 */
void picture_set_block_skipped(picture *pic, uint32_t x_scu, uint32_t y_scu,
                               uint8_t depth, int8_t skipped)
{
  const int scu_stride = pic->width_in_lcu << MAX_DEPTH;
  const int scu_per_side = (LCU_WIDTH >> depth) / (LCU_WIDTH >> MAX_DEPTH);
  const uint32_t x_end = x_scu + scu_per_side;
  const uint32_t y_end = y_scu + scu_per_side;
  uint32_t row, col;

  for (row = y_scu; row < y_end; ++row) {
    // Index of the first SCU on this row of the picture.
    const int row_start = row * scu_stride;

    for (col = x_scu; col < x_end; ++col) {
      pic->cu_array[MAX_DEPTH][row_start + col].skipped = skipped;
    }
  }
}
/**
 * \brief Store the luma residual status for every smallest CU of a block.
 *
 * Only the MAX_DEPTH layer of pic->cu_array is written.
 *
 * \param pic      picture whose CU array is updated
 * \param x_scu    x position of the block's first SCU (smallest CU)
 * \param y_scu    y position of the block's first SCU (smallest CU)
 * \param depth    CU depth of the block; determines its width in SCUs
 * \param coeff_y  value written to the coeff_y field
 */
void picture_set_block_residual(picture *pic, uint32_t x_scu, uint32_t y_scu,
                                uint8_t depth, int8_t coeff_y)
{
  const int scus_per_row = pic->width_in_lcu << MAX_DEPTH;
  const int side = (LCU_WIDTH >> depth) / (LCU_WIDTH >> MAX_DEPTH);
  uint32_t cy = y_scu;

  while (cy < y_scu + side) {
    const int first_in_row = cy * scus_per_row;
    uint32_t cx = x_scu;

    while (cx < x_scu + side) {
      pic->cu_array[MAX_DEPTH][first_in_row + cx].coeff_y = coeff_y;
      ++cx;
    }
    ++cy;
  }
}
/**
 * \brief BLock Image Transfer from one buffer to another.
 *
 * Copies a width x height rectangle of pixels row by row. The two buffers
 * may have different row strides.
 *
 * \param orig         Start of the originating buffer.
 * \param dst          Start of the destination buffer.
 * \param width        Width of the copied region.
 * \param height       Height of the copied region.
 * \param orig_stride  Width of a row in the originating buffer.
 * \param dst_stride   Width of a row in the destination buffer.
 *
 * This should be inlined, but it's defined here for now to see if Visual
 * Studios LTCG will inline it.
 */
void picture_blit_pixels(const pixel *orig, pixel *dst,
                         unsigned width, unsigned height,
                         unsigned orig_stride, unsigned dst_stride)
{
  unsigned y, x;

  for (y = 0; y < height; ++y) {
    for (x = 0; x < width; ++x) {
      dst[x] = orig[x];
    }

    // Move pointers to the next row.
    orig += orig_stride;
    dst += dst_stride;
  }
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Store the coded status for every smallest CU covered by a block.
 *
 * Unlike the skipped/residual setters, the flag is written to every depth
 * layer of pic->cu_array (0..MAX_DEPTH).
 *
 * \param pic    picture whose CU arrays are updated
 * \param x_scu  x position of the block's first SCU (smallest CU)
 * \param y_scu  y position of the block's first SCU (smallest CU)
 * \param depth  CU depth of the block; determines its width in SCUs
 * \param coded  value written to the coded field
 */
void picture_set_block_coded(picture *pic, uint32_t x_scu, uint32_t y_scu,
                             uint8_t depth, int8_t coded)
{
  const int scu_stride = pic->width_in_lcu << MAX_DEPTH;
  const int scu_per_side = (LCU_WIDTH >> depth) / (LCU_WIDTH >> MAX_DEPTH);
  uint32_t row, col, layer;

  for (row = y_scu; row < y_scu + scu_per_side; ++row) {
    const int row_start = row * scu_stride;

    for (col = x_scu; col < x_scu + scu_per_side; ++col) {
      const unsigned cu_index = row_start + col;

      for (layer = 0; layer < MAX_DEPTH + 1; ++layer) {
        pic->cu_array[layer][cu_index].coded = coded;
      }
    }
  }
}
2013-09-20 08:07:31 +00:00
/**
* \brief Allocate memory for picture_list
* \param size initial array size
* \return picture_list pointer, NULL on failure
*/
picture_list * picture_list_init(int size)
{
picture_list *list = (picture_list *)malloc(sizeof(picture_list));
list->size = size;
2013-09-20 08:07:31 +00:00
if (size > 0) {
list->pics = (picture**)malloc(sizeof(picture*) * size);
}
list->used_size = 0;
return list;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Resize picture_list array
 *
 * Allocates a new pointer array of the requested capacity, moves the stored
 * picture pointers into it, releases the old array and records the new
 * capacity in list->size. On failure the list is left untouched.
 *
 * \param list  picture_list pointer
 * \param size  new array size; must not be negative or smaller than the
 *              number of pictures currently stored
 * \return 1 on success, 0 on failure
 */
int picture_list_resize(picture_list *list, int size)
{
  unsigned int i;
  picture **new_pics = NULL;

  // No need to do anything when resizing to same size
  if (size == list->size) {
    return 1;
  }

  // Refuse sizes that cannot hold the pictures already in the list.
  if (size < 0 || (unsigned)size < list->used_size) {
    return 0;
  }

  if (size > 0) {
    new_pics = (picture**)malloc(sizeof(picture*) * size);
    if (new_pics == NULL) {
      return 0;
    }

    // Copy everything from the old list to the new.
    for (i = 0; i < list->used_size; ++i) {
      new_pics[i] = list->pics[i];
    }
  }

  // The old array only exists when the old capacity was non-zero.
  if (list->size > 0) {
    free(list->pics);
  }

  list->pics = new_pics;
  list->size = size;

  return 1;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Free memory allocated to the picture_list
 *
 * Destroys every picture still stored in the list, then releases the
 * pointer array and the list itself.
 *
 * \param list  picture_list pointer
 * \return 1 on success, 0 on failure
 */
int picture_list_destroy(picture_list *list)
{
  unsigned int i;

  for (i = 0; i < list->used_size; ++i) {
    // picture_destroy() releases the buffers owned by the picture but not
    // the picture struct itself, so free that here as picture_list_rem does.
    picture_destroy(list->pics[i]);
    free(list->pics[i]);
    list->pics[i] = NULL;
  }

  if (list->size > 0) {
    free(list->pics);
  }

  free(list);
  return 1;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Add picture to picturelist
 *
 * Appends the pointer after the last used slot. When the array is full it
 * is grown first by calling picture_list_resize().
 *
 * \param list  list to use
 * \param pic   picture pointer to add
 * \return 1 on success, 0 if the list could not be grown
 */
int picture_list_add(picture_list *list,picture* pic)
{
  if (list->size == list->used_size) {
    // Doubling a capacity of zero would stay at zero, so start from one.
    int new_size = (list->size > 0) ? list->size * 2 : 1;

    if (!picture_list_resize(list, new_size)) return 0;
  }

  list->pics[list->used_size] = pic;
  list->used_size++;

  return 1;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Remove picture from picturelist
 *
 * The pictures after the removed one are shifted one slot towards the
 * start, and the slot that becomes unused is set to NULL.
 *
 * \param list     list to use
 * \param n        index of the picture to remove
 * \param destroy  when non-zero, the picture is destroyed and freed as well
 * \return 1 on success, 0 if n is outside the used part of the list
 */
int picture_list_rem(picture_list *list, int n, int8_t destroy)
{
  unsigned int i;

  // Must be within list boundaries
  if (n < 0 || (unsigned)n >= list->used_size) {
    return 0;
  }

  if (destroy) {
    picture_destroy(list->pics[n]);
    free(list->pics[n]);
  }

  // Shift all following pics one backward in the list. When n is the last
  // used index the loop body never runs.
  for (i = (unsigned)n; i + 1 < list->used_size; ++i) {
    list->pics[i] = list->pics[i + 1];
  }

  list->used_size--;
  list->pics[list->used_size] = NULL;

  return 1;
}
2013-09-20 08:07:31 +00:00
/**
* \brief Allocate new picture
* \param pic picture pointer
* \return picture pointer
*/
picture *picture_init(int32_t width, int32_t height,
int32_t width_in_lcu, int32_t height_in_lcu)
{
picture *pic = (picture *)malloc(sizeof(picture));
unsigned int luma_size = width * height;
unsigned int chroma_size = luma_size / 4;
int i = 0;
2013-09-20 08:07:31 +00:00
if (!pic) return 0;
memset(pic, 0, sizeof(picture));
pic->width = width;
pic->height = height;
2013-09-20 08:07:31 +00:00
pic->width_in_lcu = width_in_lcu;
pic->height_in_lcu = height_in_lcu;
pic->referenced = 0;
2013-09-20 08:07:31 +00:00
// Allocate buffers
pic->y_data = MALLOC(pixel, luma_size);
pic->u_data = MALLOC(pixel, chroma_size);
pic->v_data = MALLOC(pixel, chroma_size);
2013-09-20 08:07:31 +00:00
// Reconstruction buffers
pic->y_recdata = MALLOC(pixel, luma_size);
pic->u_recdata = MALLOC(pixel, chroma_size);
pic->v_recdata = MALLOC(pixel, chroma_size);
memset(pic->u_recdata, 128, (chroma_size));
memset(pic->v_recdata, 128, (chroma_size));
2013-09-20 08:07:31 +00:00
// Allocate memory for CU info 2D array
// TODO: we don't need this much space on LCU...MAX_DEPTH-1
2013-09-20 09:49:44 +00:00
pic->cu_array = (cu_info**)malloc(sizeof(cu_info*) * (MAX_DEPTH + 1));
2013-09-20 08:07:31 +00:00
for (i = 0; i <= MAX_DEPTH; ++i) {
// Allocate height_in_scu x width_in_scu x sizeof(CU_info)
unsigned height_in_scu = height_in_lcu << MAX_DEPTH;
unsigned width_in_scu = width_in_lcu << MAX_DEPTH;
unsigned cu_array_size = height_in_scu * width_in_scu;
2013-09-20 09:49:44 +00:00
pic->cu_array[i] = (cu_info*)malloc(sizeof(cu_info) * cu_array_size);
memset(pic->cu_array[i], 0, sizeof(cu_info) * cu_array_size);
}
pic->coeff_y = NULL; pic->coeff_u = NULL; pic->coeff_v = NULL;
pic->pred_y = NULL; pic->pred_u = NULL; pic->pred_v = NULL;
2013-10-15 14:56:50 +00:00
pic->slice_sao_luma_flag = 1;
pic->slice_sao_chroma_flag = 1;
pic->sao_luma = MALLOC(sao_info, width_in_lcu * height_in_lcu);
pic->sao_chroma = MALLOC(sao_info, width_in_lcu * height_in_lcu);
return pic;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Free memory allocated to picture
 *
 * Releases every buffer owned by the picture and resets the pointers to
 * NULL. The picture struct itself is NOT freed; that is left to the caller.
 * Passing NULL, or a picture that has already been destroyed, is a no-op.
 *
 * \param pic  picture pointer
 * \return 1 on success, 0 on failure
 */
int picture_destroy(picture *pic)
{
  int i;

  if (pic == NULL) {
    return 1;
  }

  free(pic->u_data);
  free(pic->v_data);
  free(pic->y_data);
  pic->y_data = pic->u_data = pic->v_data = NULL;

  free(pic->y_recdata);
  free(pic->u_recdata);
  free(pic->v_recdata);
  pic->y_recdata = pic->u_recdata = pic->v_recdata = NULL;

  // cu_array is NULL after a previous destroy; don't index into it then.
  if (pic->cu_array != NULL) {
    for (i = 0; i <= MAX_DEPTH; ++i)
    {
      free(pic->cu_array[i]);
      pic->cu_array[i] = NULL;
    }

    free(pic->cu_array);
    pic->cu_array = NULL;
  }

  FREE_POINTER(pic->coeff_y);
  FREE_POINTER(pic->coeff_u);
  FREE_POINTER(pic->coeff_v);

  FREE_POINTER(pic->pred_y);
  FREE_POINTER(pic->pred_u);
  FREE_POINTER(pic->pred_v);

  FREE_POINTER(pic->sao_luma);
  FREE_POINTER(pic->sao_chroma);

  return 1;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Calculates image PSNR value
 *
 * Both frames are read as x * y consecutive pixels. The peak value used is
 * PSNRMAX.
 *
 * \param frame1  first frame
 * \param frame2  second frame
 * \param x       frame width in pixels
 * \param y       frame height in pixels
 * \return PSNR in dB, or 99.0 when the frames are identical
 */
double image_psnr(pixel *frame1, pixel *frame2, int32_t x, int32_t y)
{
  const int32_t pixel_count = x * y;
  uint64_t squared_error = 0;
  int32_t idx;

  for (idx = 0; idx < pixel_count; ++idx) {
    const int32_t delta = frame1[idx] - frame2[idx];
    squared_error += delta * delta;
  }

  // Avoid division by zero
  if (squared_error == 0) {
    return 99.0;
  }

  return 10 * log10((pixel_count * PSNRMAX) / ((double)squared_error));
}
2013-09-20 08:07:31 +00:00
/**
 * \brief In-place 8-point add/subtract butterfly network used by the SATD.
 *
 * Runs three stages pairing elements 4, 2 and 1 positions apart. Each pair
 * (a, b) is replaced by (a + b, a - b).
 *
 * \param v       first of the eight elements
 * \param stride  distance between consecutive elements in v
 */
static void satd_hadamard_1d_8(int32_t *v, int stride)
{
  int span, base, k;

  for (span = 4; span >= 1; span >>= 1) {
    for (base = 0; base < 8; base += 2 * span) {
      for (k = base; k < base + span; ++k) {
        const int32_t a = v[k * stride];
        const int32_t b = v[(k + span) * stride];

        v[k * stride] = a + b;
        v[(k + span) * stride] = a - b;
      }
    }
  }
}

/**
 * \brief Calculate SATD between two 8x8 blocks inside bigger arrays.
 *
 * The pixel differences are transformed with the butterfly network first
 * along every row and then along every column; the absolute values of the
 * 64 results are summed and the sum is scaled by (sum + 2) >> 2.
 *
 * \param piOrg       top-left pixel of the first block
 * \param iStrideOrg  row stride of the array containing piOrg
 * \param piCur       top-left pixel of the second block
 * \param iStrideCur  row stride of the array containing piCur
 * \return scaled sum of absolute transformed differences
 */
unsigned satd_16bit_8x8_general(pixel *piOrg, int32_t iStrideOrg, pixel *piCur, int32_t iStrideCur)
{
  int32_t coeff[8][8];
  int32_t total = 0;
  int row, col;

  // Pixel differences of the two blocks.
  for (row = 0; row < 8; ++row) {
    for (col = 0; col < 8; ++col) {
      coeff[row][col] = piOrg[row * iStrideOrg + col] - piCur[row * iStrideCur + col];
    }
  }

  // horizontal
  for (row = 0; row < 8; ++row) {
    satd_hadamard_1d_8(coeff[row], 1);
  }

  // vertical
  for (col = 0; col < 8; ++col) {
    satd_hadamard_1d_8(&coeff[0][col], 8);
  }

  for (row = 0; row < 8; ++row) {
    for (col = 0; col < 8; ++col) {
      total += abs(coeff[row][col]);
    }
  }

  total = (total + 2) >> 2;
  return total;
}
// Function macro that defines a SATD function for a fixed n x n block,
// where n is an integer multiple of 8. The block is walked in 8x8 tiles
// and the results of satd_16bit_8x8_general for each tile are added up.
// Both blocks are read as contiguous n x n arrays (row stride n).
#define SATD_NXN(n, pixel_type, suffix) \
unsigned satd_ ## suffix ## _ ## n ## x ## n( \
    pixel_type *block1, pixel_type *block2) \
{ \
  unsigned total = 0; \
  unsigned top, left; \
  for (top = 0; top < (n); top += 8) { \
    for (left = 0; left < (n); left += 8) { \
      const unsigned offset = top * (n) + left; \
      total += satd_16bit_8x8_general(&block1[offset], (n), &block2[offset], (n)); \
    } \
  } \
  return total; \
}

// Define satd_16bit_NxN for N = 8, 16, 32, 64
SATD_NXN(8, pixel, 16bit)
SATD_NXN(16, pixel, 16bit)
SATD_NXN(32, pixel, 16bit)
SATD_NXN(64, pixel, 16bit)
// Function macro that defines a SAD function for a fixed n x n block.
// Both blocks are read as contiguous n x n arrays, so the two-dimensional
// walk is done as one pass over n * n elements.
#define SAD_NXN(n, pixel_type, suffix) \
unsigned sad_ ## suffix ## _ ## n ## x ## n( \
    pixel_type *block1, pixel_type *block2) \
{ \
  unsigned total = 0; \
  unsigned idx; \
  for (idx = 0; idx < (n) * (n); ++idx) { \
    total += abs(block1[idx] - block2[idx]); \
  } \
  return total; \
}

// Define sad_16bit_nxn functions for n = 4, 8, 16, 32, 64
// with function signatures of cost_16bit_nxn_func.
// They are used through get_sad_16bit_nxn_func.
SAD_NXN(4, pixel, 16bit)
SAD_NXN(8, pixel, 16bit)
SAD_NXN(16, pixel, 16bit)
SAD_NXN(32, pixel, 16bit)
SAD_NXN(64, pixel, 16bit)
2013-09-20 08:07:31 +00:00
/**
 * \brief Look up the fixed-size SATD function for an NxN block.
 *
 * \param n  Width of the region for which SATD is calculated.
 *
 * \returns Pointer to cost_16bit_nxn_func for n = 8, 16, 32 or 64,
 *          NULL for any other n.
 */
cost_16bit_nxn_func get_satd_16bit_nxn_func(unsigned n)
{
  cost_16bit_nxn_func func = NULL;

  if (n == 8) {
    func = &satd_16bit_8x8;
  } else if (n == 16) {
    func = &satd_16bit_16x16;
  } else if (n == 32) {
    func = &satd_16bit_32x32;
  } else if (n == 64) {
    func = &satd_16bit_64x64;
  }

  return func;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Look up the fixed-size SAD function for an NxN block.
 *
 * \param n  Width of the region for which SAD is calculated.
 *
 * \returns Pointer to cost_16bit_nxn_func for n = 4, 8, 16, 32 or 64,
 *          NULL for any other n.
 */
cost_16bit_nxn_func get_sad_16bit_nxn_func(unsigned n)
{
  cost_16bit_nxn_func func = NULL;

  if (n == 4) {
    func = &sad_16bit_4x4;
  } else if (n == 8) {
    func = &sad_16bit_8x8;
  } else if (n == 16) {
    func = &sad_16bit_16x16;
  } else if (n == 32) {
    func = &sad_16bit_32x32;
  } else if (n == 64) {
    func = &sad_16bit_64x64;
  }

  return func;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Calculate SATD for NxN block of size N.
 *
 * Uses the fixed-size function from get_satd_16bit_nxn_func when one exists.
 * For any other n there is no such function, so instead of calling through
 * a NULL pointer:
 *  - when n is a multiple of 8, the block is covered with 8x8 tiles using
 *    satd_16bit_8x8_general;
 *  - otherwise no 8x8 tiling is possible and the plain sum of absolute
 *    differences is returned as a stand-in cost.
 *
 * \param block1  Start of the first block (contiguous n x n pixels).
 * \param block2  Start of the second block (contiguous n x n pixels).
 * \param n       Width of the region for which SATD is calculated.
 *
 * \returns Sum of Absolute Transformed Differences (SATD)
 */
unsigned satd_nxn_16bit(pixel *block1, pixel *block2, unsigned n)
{
  cost_16bit_nxn_func satd_func = get_satd_16bit_nxn_func(n);
  unsigned x, y;
  unsigned sum = 0;

  if (satd_func) {
    return satd_func(block1, block2);
  }

  if (n % 8 == 0) {
    for (y = 0; y < n; y += 8) {
      for (x = 0; x < n; x += 8) {
        sum += satd_16bit_8x8_general(&block1[y * n + x], n,
                                      &block2[y * n + x], n);
      }
    }
    return sum;
  }

  // No transform available for this size: fall back to untransformed SAD.
  for (x = 0; x < n * n; ++x) {
    sum += abs(block1[x] - block2[x]);
  }
  return sum;
}
2013-09-20 08:07:31 +00:00
/**
 * \brief Calculate SAD for NxN block of size N.
 *
 * Uses the fixed-size function from get_sad_16bit_nxn_func when one exists
 * and a generic loop over all n rows otherwise.
 *
 * \param block1  Start of the first block (contiguous n x n pixels).
 * \param block2  Start of the second block (contiguous n x n pixels).
 * \param n       Width of the region for which SAD is calculated.
 *
 * \returns Sum of Absolute Differences
 */
unsigned sad_nxn_16bit(pixel *block1, pixel *block2, unsigned n)
{
  cost_16bit_nxn_func sad_func = get_sad_16bit_nxn_func(n);

  if (sad_func) {
    return sad_func(block1, block2);
  } else {
    unsigned row, x;
    unsigned sum = 0;

    // row is the offset of the first pixel of each row, so it has to run
    // up to n * n to visit all n rows.
    for (row = 0; row < n * n; row += n) {
      for (x = 0; x < n; ++x) {
        sum += abs(block1[row + x] - block2[row + x]);
      }
    }

    return sum;
  }
}
/**
 * \brief Diagonally interpolate SAD outside the frame.
 *
 * Every pixel of the picture region is compared against the single
 * reference pixel that ref_data points to.
 *
 * \param pic_data      Top-left pixel of the region in the picture.
 * \param ref_data      The reference pixel used for the whole region.
 * \param block_width   Width of the region for which SAD is calculated.
 * \param block_height  Height of the region for which SAD is calculated.
 * \param width         Width of the pixel array (row stride of pic_data).
 *
 * \returns Sum of Absolute Differences
 */
unsigned cor_sad(const pixel *pic_data, const pixel *ref_data,
                 int block_width, int block_height, unsigned width)
{
  const pixel corner = *ref_data;
  unsigned total = 0;
  int row, col;

  for (row = 0; row < block_height; ++row) {
    const unsigned row_offset = row * width;

    for (col = 0; col < block_width; ++col) {
      total += abs(pic_data[row_offset + col] - corner);
    }
  }

  return total;
}
/**
 * \brief Vertically interpolate SAD outside the frame.
 *
 * Every row of the picture region is compared against the same single row
 * of reference pixels starting at ref_data.
 *
 * \param pic_data      Top-left pixel of the region in the picture.
 * \param ref_data      First pixel of the reference row used for all rows.
 * \param block_width   Width of the region for which SAD is calculated.
 * \param block_height  Height of the region for which SAD is calculated.
 * \param width         Width of the pixel array (row stride of pic_data).
 *
 * \returns Sum of Absolute Differences
 */
unsigned ver_sad(const pixel *pic_data, const pixel *ref_data,
                 int block_width, int block_height, unsigned width)
{
  unsigned total = 0;
  int row, col;

  for (row = 0; row < block_height; ++row) {
    const unsigned row_offset = row * width;

    for (col = 0; col < block_width; ++col) {
      total += abs(pic_data[row_offset + col] - ref_data[col]);
    }
  }

  return total;
}
/**
 * \brief Horizontally interpolate SAD outside the frame.
 *
 * Every pixel on a row of the picture region is compared against the first
 * reference pixel of the corresponding row (ref_data[row * width]).
 *
 * \param pic_data      Top-left pixel of the region in the picture.
 * \param ref_data      First pixel of the reference column used for all columns.
 * \param block_width   Width of the region for which SAD is calculated.
 * \param block_height  Height of the region for which SAD is calculated.
 * \param width         Width of the pixel array (row stride of both buffers).
 *
 * \returns Sum of Absolute Differences
 */
unsigned hor_sad(const pixel *pic_data, const pixel *ref_data,
                 int block_width, int block_height, unsigned width)
{
  unsigned total = 0;
  int row, col;

  for (row = 0; row < block_height; ++row) {
    const unsigned row_offset = row * width;

    for (col = 0; col < block_width; ++col) {
      total += abs(pic_data[row_offset + col] - ref_data[row_offset]);
    }
  }

  return total;
}
/**
 * \brief Calculate Sum of Absolute Differences (SAD)
 *
 * Calculate Sum of Absolute Differences (SAD) between two rectangular regions
 * located in arbitrary points in the picture. Both regions are addressed
 * with the same row stride.
 *
 * \param data1   Starting point of the first picture.
 * \param data2   Starting point of the second picture.
 * \param width   Width of the region for which SAD is calculated.
 * \param height  Height of the region for which SAD is calculated.
 * \param stride  Width of the pixel array.
 *
 * \returns Sum of Absolute Differences
 */
unsigned reg_sad(const pixel *data1, const pixel *data2,
                 int width, int height, unsigned stride)
{
  unsigned total = 0;
  int row, col;

  for (row = 0; row < height; ++row) {
    const unsigned row_offset = row * stride;

    for (col = 0; col < width; ++col) {
      const int a = (int)data1[row_offset + col];
      const int b = (int)data2[row_offset + col];

      total += abs(a - b);
    }
  }

  return total;
}
/**
 * \brief Handle special cases of comparing blocks that are not completely
 *        inside the frame.
 *
 * The block is split into up to four regions depending on which frame edges
 * the reference block crosses. The part that lies inside the frame is
 * compared with reg_sad. A part beyond a left/right edge is compared with
 * hor_sad against the nearest in-frame reference column, a part beyond the
 * top/bottom edge with ver_sad against the nearest in-frame reference row,
 * and a part beyond a corner with cor_sad against the single in-frame
 * corner pixel. The partial results are added together.
 *
 * Only the luma plane (y_data) of both pictures is read, and both are
 * indexed using the width of pic.
 * NOTE(review): this presumably requires ref to have the same dimensions
 * as pic - confirm against callers.
 *
 * \param pic First frame.
 * \param ref Second frame.
 * \param pic_x X coordinate of the first block.
 * \param pic_y Y coordinate of the first block.
 * \param ref_x X coordinate of the second block.
 * \param ref_y Y coordinate of the second block.
 * \param block_width Width of the blocks.
 * \param block_height Height of the blocks.
 *
 * \returns Sum of Absolute Differences over the whole block.
 */
unsigned interpolated_sad(const picture *pic, const picture *ref,
int pic_x, int pic_y, int ref_x, int ref_y,
int block_width, int block_height)
{
pixel *pic_data, *ref_data;
int width = pic->width;
int height = pic->height;
// These are the number of pixels by how far the movement vector points
// outside the frame. They are always >= 0. If all of them are 0, the
// movement vector doesn't point outside the frame.
int left = (ref_x < 0) ? -ref_x : 0;
int top = (ref_y < 0) ? -ref_y : 0;
int right = (ref_x + block_width > width) ? ref_x + block_width - width : 0;
int bottom = (ref_y + block_height > height) ? ref_y + block_height - height : 0;
unsigned result = 0;
// Center picture to the current block and reference to the point where
// movement vector is pointing to. That point might be outside the buffer,
// but that is ok because we project the movement vector to the buffer
// before dereferencing the pointer.
pic_data = &pic->y_data[pic_y * width + pic_x];
ref_data = &ref->y_data[ref_y * width + ref_x];
// The handling of movement vectors that point outside the picture is done
// in the following way.
// - Correct the index of ref_data so that it points to the top-left
// of the area we want to compare against.
// - Correct the index of pic_data to point inside the current block, so
// that we compare the right part of the block to the ref_data.
// - Reduce block_width and block_height so that the the size of the area
// being compared is correct.
// NOTE(review): the chain below tests the corner combinations first and
// never combines left with right or top with bottom, so a reference block
// that crosses two opposite edges only has one of them handled - confirm
// that callers cannot produce that situation.
// Reference crosses the top-left corner: corner, top strip, left strip and
// the in-frame remainder.
if (top && left) {
result += cor_sad(pic_data,
&ref_data[top * width + left],
left, top, width);
result += ver_sad(&pic_data[left],
&ref_data[top * width + left],
block_width - left, top, width);
result += hor_sad(&pic_data[top * width],
&ref_data[top * width + left],
left, block_height - top, width);
result += reg_sad(&pic_data[top * width + left],
&ref_data[top * width + left],
block_width - left, block_height - top, width);
// Reference crosses the top-right corner. The column at
// block_width - right - 1 is the last reference column inside the frame.
} else if (top && right) {
result += ver_sad(pic_data,
&ref_data[top * width],
block_width - right, top, width);
result += cor_sad(&pic_data[block_width - right],
&ref_data[top * width + (block_width - right - 1)],
right, top, width);
result += reg_sad(&pic_data[top * width],
&ref_data[top * width],
block_width - right, block_height - top, width);
result += hor_sad(&pic_data[top * width + (block_width - right)],
&ref_data[top * width + (block_width - right - 1)],
right, block_height - top, width);
// Reference crosses the bottom-left corner. The row at
// block_height - bottom - 1 is the last reference row inside the frame.
} else if (bottom && left) {
result += hor_sad(pic_data,
&ref_data[left],
left, block_height - bottom, width);
result += reg_sad(&pic_data[left],
&ref_data[left],
block_width - left, block_height - bottom, width);
result += cor_sad(&pic_data[(block_height - bottom) * width],
&ref_data[(block_height - bottom - 1) * width + left],
left, bottom, width);
result += ver_sad(&pic_data[(block_height - bottom) * width + left],
&ref_data[(block_height - bottom - 1) * width + left],
block_width - left, bottom, width);
// Reference crosses the bottom-right corner.
} else if (bottom && right) {
result += reg_sad(pic_data,
ref_data,
block_width - right, block_height - bottom, width);
result += hor_sad(&pic_data[block_width - right],
&ref_data[block_width - right - 1],
right, block_height - bottom, width);
result += ver_sad(&pic_data[(block_height - bottom) * width],
&ref_data[(block_height - bottom - 1) * width],
block_width - right, bottom, width);
result += cor_sad(&pic_data[(block_height - bottom) * width + block_width - right],
&ref_data[(block_height - bottom - 1) * width + block_width - right - 1],
right, bottom, width);
// Reference crosses only the top edge: the first `top` rows of the block
// are compared against the first in-frame reference row.
} else if (top) {
result += ver_sad(pic_data,
&ref_data[top * width],
block_width, top, width);
result += reg_sad(&pic_data[top * width],
&ref_data[top * width],
block_width, block_height - top, width);
// Reference crosses only the bottom edge: the last `bottom` rows of the
// block are compared against the last in-frame reference row.
} else if (bottom) {
result += reg_sad(pic_data,
ref_data,
block_width, block_height - bottom, width);
result += ver_sad(&pic_data[(block_height - bottom) * width],
&ref_data[(block_height - bottom - 1) * width],
block_width, bottom, width);
// Reference crosses only the left edge: the first `left` columns of the
// block are compared against the first in-frame reference column.
} else if (left) {
result += hor_sad(pic_data,
&ref_data[left],
left, block_height, width);
result += reg_sad(&pic_data[left],
&ref_data[left],
block_width - left, block_height, width);
// Reference crosses only the right edge: the last `right` columns of the
// block are compared against the last in-frame reference column.
} else if (right) {
result += reg_sad(pic_data,
ref_data,
block_width - right, block_height, width);
result += hor_sad(&pic_data[block_width - right],
&ref_data[block_width - right - 1],
right, block_height, width);
// Reference block is completely inside the frame.
} else {
result += reg_sad(pic_data, ref_data, block_width, block_height, width);
}
return result;
}
/**
 * \brief Get Sum of Absolute Differences (SAD) between two blocks in two
 *        different frames.
 *
 * Reference blocks that are fully inside the frame are compared directly
 * with reg_sad; all other cases are delegated to interpolated_sad. Only
 * the luma plane (y_data) is read, indexed with the width of pic.
 *
 * \param pic First frame.
 * \param ref Second frame.
 * \param pic_x X coordinate of the first block.
 * \param pic_y Y coordinate of the first block.
 * \param ref_x X coordinate of the second block.
 * \param ref_y Y coordinate of the second block.
 * \param block_width Width of the blocks.
 * \param block_height Height of the blocks.
 *
 * \returns Sum of Absolute Differences
 */
unsigned calc_sad(const picture *pic, const picture *ref,
                  int pic_x, int pic_y, int ref_x, int ref_y,
                  int block_width, int block_height)
{
  const int inside_x = ref_x >= 0 && ref_x <= pic->width - block_width;
  const int inside_y = ref_y >= 0 && ref_y <= pic->height - block_height;

  if (!(inside_x && inside_y)) {
    // Hand over to the routine that knows how to interpolate pixels
    // outside the frame.
    return interpolated_sad(pic, ref, pic_x, pic_y, ref_x, ref_y,
                            block_width, block_height);
  }

  // Reference block is completely inside the frame, so just calculate the
  // SAD directly. This is the most common case.
  {
    const pixel *pic_block = &pic->y_data[pic_y * pic->width + pic_x];
    const pixel *ref_block = &ref->y_data[ref_y * pic->width + ref_x];

    return reg_sad(pic_block, ref_block, block_width, block_height, pic->width);
  }
}