vp8/common/variance_c.c

   1 /*
   2  *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
   3  *
   4  *  Use of this source code is governed by a BSD-style license
   5  *  that can be found in the LICENSE file in the root of the source
   6  *  tree. An additional intellectual property rights grant can be found
   7  *  in the file PATENTS.  All contributing project authors may
   8  *  be found in the AUTHORS file in the root of the source tree.
   9  */
  10
  11
  12 #include "variance.h"
  13 #include "filter.h"
  14
  15
  16 unsigned int vp8_get_mb_ss_c
  17 (
  18     const short *src_ptr
  19 )
  20 {
  21     unsigned int i = 0, sum = 0;
  22
  23     do
  24     {
  25         sum += (src_ptr[i] * src_ptr[i]);
  26         i++;
  27     }
  28     while (i < 256);
  29
  30     return sum;
  31 }
  32
  33
  34 static void variance(
  35     const unsigned char *src_ptr,
  36     int  source_stride,
  37     const unsigned char *ref_ptr,
  38     int  recon_stride,
  39     int  w,
  40     int  h,
  41     unsigned int *sse,
  42     int *sum)
  43 {
  44     int i, j;
  45     int diff;
  46
  47     *sum = 0;
  48     *sse = 0;
  49
  50     for (i = 0; i < h; i++)
  51     {
  52         for (j = 0; j < w; j++)
  53         {
  54             diff = src_ptr[j] - ref_ptr[j];
  55             *sum += diff;
  56             *sse += diff * diff;
  57         }
  58
  59         src_ptr += source_stride;
  60         ref_ptr += recon_stride;
  61     }
  62 }
  63
  64
  65 unsigned int vp8_variance16x16_c(
  66     const unsigned char *src_ptr,
  67     int  source_stride,
  68     const unsigned char *ref_ptr,
  69     int  recon_stride,
  70     unsigned int *sse)
  71 {
  72     unsigned int var;
  73     int avg;
  74
  75
  76     variance(src_ptr, source_stride, ref_ptr, recon_stride, 16, 16, &var, &avg);
  77     *sse = var;
  78     return (var - ((unsigned int)(avg * avg) >> 8));
  79 }
  80
  81 unsigned int vp8_variance8x16_c(
  82     const unsigned char *src_ptr,
  83     int  source_stride,
  84     const unsigned char *ref_ptr,
  85     int  recon_stride,
  86     unsigned int *sse)
  87 {
  88     unsigned int var;
  89     int avg;
  90
  91
  92     variance(src_ptr, source_stride, ref_ptr, recon_stride, 8, 16, &var, &avg);
  93     *sse = var;
  94     return (var - ((unsigned int)(avg * avg) >> 7));
  95 }
  96
  97 unsigned int vp8_variance16x8_c(
  98     const unsigned char *src_ptr,
  99     int  source_stride,
 100     const unsigned char *ref_ptr,
 101     int  recon_stride,
 102     unsigned int *sse)
 103 {
 104     unsigned int var;
 105     int avg;
 106
 107
 108     variance(src_ptr, source_stride, ref_ptr, recon_stride, 16, 8, &var, &avg);
 109     *sse = var;
 110     return (var - ((unsigned int)(avg * avg) >> 7));
 111 }
 112
 113
 114 unsigned int vp8_variance8x8_c(
 115     const unsigned char *src_ptr,
 116     int  source_stride,
 117     const unsigned char *ref_ptr,
 118     int  recon_stride,
 119     unsigned int *sse)
 120 {
 121     unsigned int var;
 122     int avg;
 123
 124
 125     variance(src_ptr, source_stride, ref_ptr, recon_stride, 8, 8, &var, &avg);
 126     *sse = var;
 127     return (var - ((unsigned int)(avg * avg) >> 6));
 128 }
 129
 130 unsigned int vp8_variance4x4_c(
 131     const unsigned char *src_ptr,
 132     int  source_stride,
 133     const unsigned char *ref_ptr,
 134     int  recon_stride,
 135     unsigned int *sse)
 136 {
 137     unsigned int var;
 138     int avg;
 139
 140
 141     variance(src_ptr, source_stride, ref_ptr, recon_stride, 4, 4, &var, &avg);
 142     *sse = var;
 143     return (var - ((unsigned int)(avg * avg) >> 4));
 144 }
 145
 146
 147 unsigned int vp8_mse16x16_c(
 148     const unsigned char *src_ptr,
 149     int  source_stride,
 150     const unsigned char *ref_ptr,
 151     int  recon_stride,
 152     unsigned int *sse)
 153 {
 154     unsigned int var;
 155     int avg;
 156
 157     variance(src_ptr, source_stride, ref_ptr, recon_stride, 16, 16, &var, &avg);
 158     *sse = var;
 159     return var;
 160 }
 161
 162
 163 /****************************************************************************
 164  *
 165  *  ROUTINE       : filter_block2d_bil_first_pass
 166  *
 167  *  INPUTS        : UINT8  *src_ptr          : Pointer to source block.
 168  *                  UINT32 src_pixels_per_line : Stride of input block.
 169  *                  UINT32 pixel_step        : Offset between filter input samples (see notes).
 170  *                  UINT32 output_height     : Input block height.
 171  *                  UINT32 output_width      : Input block width.
 172  *                  INT32  *vp8_filter          : Array of 2 bi-linear filter taps.
 173  *
 174  *  OUTPUTS       : INT32 *output_ptr        : Pointer to filtered block.
 175  *
 176  *  RETURNS       : void
 177  *
 178  *  FUNCTION      : Applies a 1-D 2-tap bi-linear filter to the source block in
 179  *                  either horizontal or vertical direction to produce the
 180  *                  filtered output block. Used to implement first-pass
 181  *                  of 2-D separable filter.
 182  *
 183  *  SPECIAL NOTES : Produces INT32 output to retain precision for next pass.
 184  *                  Two filter taps should sum to VP8_FILTER_WEIGHT.
 185  *                  pixel_step defines whether the filter is applied
 186  *                  horizontally (pixel_step=1) or vertically (pixel_step=stride).
 187  *                  It defines the offset required to move from one input
 188  *                  to the next.
 189  *
 190  ****************************************************************************/
 191 static void var_filter_block2d_bil_first_pass
 192 (
 193     const unsigned char *src_ptr,
 194     unsigned short *output_ptr,
 195     unsigned int src_pixels_per_line,
 196     int pixel_step,
 197     unsigned int output_height,
 198     unsigned int output_width,
 199     const short *vp8_filter
 200 )
 201 {
 202     unsigned int i, j;
 203
 204     for (i = 0; i < output_height; i++)
 205     {
 206         for (j = 0; j < output_width; j++)
 207         {
 208             // Apply bilinear filter
 209             output_ptr[j] = (((int)src_ptr[0]          * vp8_filter[0]) +
 210                              ((int)src_ptr[pixel_step] * vp8_filter[1]) +
 211                              (VP8_FILTER_WEIGHT / 2)) >> VP8_FILTER_SHIFT;
 212             src_ptr++;
 213         }
 214
 215         // Next row...
 216         src_ptr    += src_pixels_per_line - output_width;
 217         output_ptr += output_width;
 218     }
 219 }
 220
 221 /****************************************************************************
 222  *
 223  *  ROUTINE       : filter_block2d_bil_second_pass
 224  *
 225  *  INPUTS        : INT32  *src_ptr          : Pointer to source block.
 226  *                  UINT32 src_pixels_per_line : Stride of input block.
 227  *                  UINT32 pixel_step        : Offset between filter input samples (see notes).
 228  *                  UINT32 output_height     : Input block height.
 229  *                  UINT32 output_width      : Input block width.
 230  *                  INT32  *vp8_filter          : Array of 2 bi-linear filter taps.
 231  *
 232  *  OUTPUTS       : UINT16 *output_ptr       : Pointer to filtered block.
 233  *
 234  *  RETURNS       : void
 235  *
 236  *  FUNCTION      : Applies a 1-D 2-tap bi-linear filter to the source block in
 237  *                  either horizontal or vertical direction to produce the
 238  *                  filtered output block. Used to implement second-pass
 239  *                  of 2-D separable filter.
 240  *
 241  *  SPECIAL NOTES : Requires 32-bit input as produced by filter_block2d_bil_first_pass.
 242  *                  Two filter taps should sum to VP8_FILTER_WEIGHT.
 243  *                  pixel_step defines whether the filter is applied
 244  *                  horizontally (pixel_step=1) or vertically (pixel_step=stride).
 245  *                  It defines the offset required to move from one input
 246  *                  to the next.
 247  *
 248  ****************************************************************************/
 249 static void var_filter_block2d_bil_second_pass
 250 (
 251     const unsigned short *src_ptr,
 252     unsigned char  *output_ptr,
 253     unsigned int  src_pixels_per_line,
 254     unsigned int  pixel_step,
 255     unsigned int  output_height,
 256     unsigned int  output_width,
 257     const short *vp8_filter
 258 )
 259 {
 260     unsigned int  i, j;
 261     int  Temp;
 262
 263     for (i = 0; i < output_height; i++)
 264     {
 265         for (j = 0; j < output_width; j++)
 266         {
 267             // Apply filter
 268             Temp = ((int)src_ptr[0]         * vp8_filter[0]) +
 269                    ((int)src_ptr[pixel_step] * vp8_filter[1]) +
 270                    (VP8_FILTER_WEIGHT / 2);
 271             output_ptr[j] = (unsigned int)(Temp >> VP8_FILTER_SHIFT);
 272             src_ptr++;
 273         }
 274
 275         // Next row...
 276         src_ptr    += src_pixels_per_line - output_width;
 277         output_ptr += output_width;
 278     }
 279 }
 280
 281
 282 unsigned int vp8_sub_pixel_variance4x4_c
 283 (
 284     const unsigned char  *src_ptr,
 285     int  src_pixels_per_line,
 286     int  xoffset,
 287     int  yoffset,
 288     const unsigned char *dst_ptr,
 289     int dst_pixels_per_line,
 290     unsigned int *sse
 291 )
 292 {
 293     unsigned char  temp2[20*16];
 294     const short *HFilter, *VFilter;
 295     unsigned short FData3[5*4]; // Temp data bufffer used in filtering
 296
 297     HFilter = vp8_bilinear_filters[xoffset];
 298     VFilter = vp8_bilinear_filters[yoffset];
 299
 300     // First filter 1d Horizontal
 301     var_filter_block2d_bil_first_pass(src_ptr, FData3, src_pixels_per_line, 1, 5, 4, HFilter);
 302
 303     // Now filter Verticaly
 304     var_filter_block2d_bil_second_pass(FData3, temp2, 4,  4,  4,  4, VFilter);
 305
 306     return vp8_variance4x4_c(temp2, 4, dst_ptr, dst_pixels_per_line, sse);
 307 }
 308
 309
 310 unsigned int vp8_sub_pixel_variance8x8_c
 311 (
 312     const unsigned char  *src_ptr,
 313     int  src_pixels_per_line,
 314     int  xoffset,
 315     int  yoffset,
 316     const unsigned char *dst_ptr,
 317     int dst_pixels_per_line,
 318     unsigned int *sse
 319 )
 320 {
 321     unsigned short FData3[9*8]; // Temp data bufffer used in filtering
 322     unsigned char  temp2[20*16];
 323     const short *HFilter, *VFilter;
 324
 325     HFilter = vp8_bilinear_filters[xoffset];
 326     VFilter = vp8_bilinear_filters[yoffset];
 327
 328     var_filter_block2d_bil_first_pass(src_ptr, FData3, src_pixels_per_line, 1, 9, 8, HFilter);
 329     var_filter_block2d_bil_second_pass(FData3, temp2, 8, 8, 8, 8, VFilter);
 330
 331     return vp8_variance8x8_c(temp2, 8, dst_ptr, dst_pixels_per_line, sse);
 332 }
 333
 334 unsigned int vp8_sub_pixel_variance16x16_c
 335 (
 336     const unsigned char  *src_ptr,
 337     int  src_pixels_per_line,
 338     int  xoffset,
 339     int  yoffset,
 340     const unsigned char *dst_ptr,
 341     int dst_pixels_per_line,
 342     unsigned int *sse
 343 )
 344 {
 345     unsigned short FData3[17*16];   // Temp data bufffer used in filtering
 346     unsigned char  temp2[20*16];
 347     const short *HFilter, *VFilter;
 348
 349     HFilter = vp8_bilinear_filters[xoffset];
 350     VFilter = vp8_bilinear_filters[yoffset];
 351
 352     var_filter_block2d_bil_first_pass(src_ptr, FData3, src_pixels_per_line, 1, 17, 16, HFilter);
 353     var_filter_block2d_bil_second_pass(FData3, temp2, 16, 16, 16, 16, VFilter);
 354
 355     return vp8_variance16x16_c(temp2, 16, dst_ptr, dst_pixels_per_line, sse);
 356 }
 357
 358
 359 unsigned int vp8_variance_halfpixvar16x16_h_c(
 360     const unsigned char *src_ptr,
 361     int  source_stride,
 362     const unsigned char *ref_ptr,
 363     int  recon_stride,
 364     unsigned int *sse)
 365 {
 366     return vp8_sub_pixel_variance16x16_c(src_ptr, source_stride, 4, 0,
 367                                          ref_ptr, recon_stride, sse);
 368 }
 369
 370
 371 unsigned int vp8_variance_halfpixvar16x16_v_c(
 372     const unsigned char *src_ptr,
 373     int  source_stride,
 374     const unsigned char *ref_ptr,
 375     int  recon_stride,
 376     unsigned int *sse)
 377 {
 378     return vp8_sub_pixel_variance16x16_c(src_ptr, source_stride, 0, 4,
 379                                          ref_ptr, recon_stride, sse);
 380 }
 381
 382
 383 unsigned int vp8_variance_halfpixvar16x16_hv_c(
 384     const unsigned char *src_ptr,
 385     int  source_stride,
 386     const unsigned char *ref_ptr,
 387     int  recon_stride,
 388     unsigned int *sse)
 389 {
 390     return vp8_sub_pixel_variance16x16_c(src_ptr, source_stride, 4, 4,
 391                                          ref_ptr, recon_stride, sse);
 392 }
 393
 394
 395 unsigned int vp8_sub_pixel_mse16x16_c
 396 (
 397     const unsigned char  *src_ptr,
 398     int  src_pixels_per_line,
 399     int  xoffset,
 400     int  yoffset,
 401     const unsigned char *dst_ptr,
 402     int dst_pixels_per_line,
 403     unsigned int *sse
 404 )
 405 {
 406     vp8_sub_pixel_variance16x16_c(src_ptr, src_pixels_per_line, xoffset, yoffset, dst_ptr, dst_pixels_per_line, sse);
 407     return *sse;
 408 }
 409
 410 unsigned int vp8_sub_pixel_variance16x8_c
 411 (
 412     const unsigned char  *src_ptr,
 413     int  src_pixels_per_line,
 414     int  xoffset,
 415     int  yoffset,
 416     const unsigned char *dst_ptr,
 417     int dst_pixels_per_line,
 418     unsigned int *sse
 419 )
 420 {
 421     unsigned short FData3[16*9];    // Temp data bufffer used in filtering
 422     unsigned char  temp2[20*16];
 423     const short *HFilter, *VFilter;
 424
 425     HFilter = vp8_bilinear_filters[xoffset];
 426     VFilter = vp8_bilinear_filters[yoffset];
 427
 428     var_filter_block2d_bil_first_pass(src_ptr, FData3, src_pixels_per_line, 1, 9, 16, HFilter);
 429     var_filter_block2d_bil_second_pass(FData3, temp2, 16, 16, 8, 16, VFilter);
 430
 431     return vp8_variance16x8_c(temp2, 16, dst_ptr, dst_pixels_per_line, sse);
 432 }
 433
 434 unsigned int vp8_sub_pixel_variance8x16_c
 435 (
 436     const unsigned char  *src_ptr,
 437     int  src_pixels_per_line,
 438     int  xoffset,
 439     int  yoffset,
 440     const unsigned char *dst_ptr,
 441     int dst_pixels_per_line,
 442     unsigned int *sse
 443 )
 444 {
 445     unsigned short FData3[9*16];    // Temp data bufffer used in filtering
 446     unsigned char  temp2[20*16];
 447     const short *HFilter, *VFilter;
 448
 449
 450     HFilter = vp8_bilinear_filters[xoffset];
 451     VFilter = vp8_bilinear_filters[yoffset];
 452
 453
 454     var_filter_block2d_bil_first_pass(src_ptr, FData3, src_pixels_per_line, 1, 17, 8, HFilter);
 455     var_filter_block2d_bil_second_pass(FData3, temp2, 8, 8, 16, 8, VFilter);
 456
 457     return vp8_variance8x16_c(temp2, 8, dst_ptr, dst_pixels_per_line, sse);
 458 }