/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
12 #include "vp8/common/onyxc_int.h"
15 #include "vpx_mem/vpx_mem.h"
16 #include "vpx_scale/yv12extend.h"
17 #include "vpx_scale/vpxscale.h"
18 #include "vp8/common/alloccommon.h"
20 #include "vpx_ports/arm.h"
// Prototypes for routines defined outside this file.
//
// Loop-filter entry points. Only the _yonly variant is called in the lines
// visible in this file (from vp8cx_pick_filter_level).
23 extern void vp8_loop_filter_frame(VP8_COMMON *cm, MACROBLOCKD *mbd, int filt_val);
24 extern void vp8_loop_filter_frame_yonly(VP8_COMMON *cm, MACROBLOCKD *mbd, int filt_val, int sharpness_lvl);
// Error score between a source buffer and a reconstructed buffer; used by
// vp8cx_pick_filter_level to rank candidate filter levels.
25 extern int vp8_calc_ss_err(YV12_BUFFER_CONFIG *source, YV12_BUFFER_CONFIG *dest, const vp8_variance_rtcd_vtable_t *rtcd);
// NEON copy routine, called only on the HAS_NEON paths of
// vp8cx_pick_filter_level.
// NOTE(review): any architecture guard around this prototype is not visible
// in this listing — confirm against the original file.
27 extern void vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(YV12_BUFFER_CONFIG *src_ybc, YV12_BUFFER_CONFIG *dst_ybc);
// IF_RTCD(x) yields x itself when CONFIG_RUNTIME_CPU_DETECT is set; the second
// definition yields NULL instead. It wraps the variance table pointer passed
// to the error-scoring routines below.
// NOTE(review): the #else / #endif that separate and close the two
// definitions are not visible in this listing — confirm against the original.
30 #if CONFIG_RUNTIME_CPU_DETECT
31 #define IF_RTCD(x) (x)
33 #define IF_RTCD(x) NULL
// Declaration of the vp8_yv12_copy_partial_frame_ptr function pointer, which
// vp8cx_pick_filter_level_fast calls as (source buffer, destination buffer, 3).
// NOTE(review): the leading storage class / return type and the final
// parameter of this declaration are not visible in this listing.
37 (*vp8_yv12_copy_partial_frame_ptr)(YV12_BUFFER_CONFIG *src_ybc,
38 YV12_BUFFER_CONFIG *dst_ybc,
// Copies a band of luma (Y) rows from src_ybc to dst_ybc with a single
// vpx_memcpy.
//
// src_ybc:  buffer read from; its y_height, y_stride and border are read.
// dst_ybc:  buffer written to, at the same byte offset as the source.
// Fraction: larger values shrink the initial line count, which is
//           y_height >> (Fraction + 4).
//
// NOTE(review): the return type, the braces and the declarations of yheight,
// ystride, border, yoffset and linestocopy are not visible in this listing,
// and the embedded numbering jumps from 54 to 61 — confirm that nothing else
// adjusts linestocopy before it is used.
41 vp8_yv12_copy_partial_frame(YV12_BUFFER_CONFIG *src_ybc, YV12_BUFFER_CONFIG *dst_ybc, int Fraction)
43 unsigned char *src_y, *dst_y;
// border is read here but is not used by any line visible below.
50 border = src_ybc->border;
51 yheight = src_ybc->y_height;
52 ystride = src_ybc->y_stride;
54 linestocopy = (yheight >> (Fraction + 4));
// Start 8 rows above the row index (yheight / 32, rounded down) * 16.
61 yoffset = ystride * ((yheight >> 5) * 16 - 8);
// The same byte offset, computed from the source stride, is applied to both
// buffers.
// NOTE(review): this assumes both buffers share one y_stride — confirm.
62 src_y = src_ybc->y_buffer + yoffset;
63 dst_y = dst_ybc->y_buffer + yoffset;
// Copy linestocopy + 16 rows of ystride bytes each.
65 vpx_memcpy(dst_y, src_y, ystride *(linestocopy + 16));
// Walks the luma planes of `source` and `dest` in 16x16 blocks and adds the
// value returned by the rtcd mse16x16 function for each block into Total.
//
// source:   buffer compared against (its y_width bounds the column loop).
// dest:     buffer being scored.
// Fraction: sets the row count as source->y_height >> (Fraction + 4).
// rtcd:     variance dispatch table handed to VARIANCE_INVOKE.
//
// NOTE(review): the braces, the declarations of i, j, Total and sse, and the
// return statement are not visible in this listing; the embedded numbering
// also jumps from 76 to 85 — confirm that nothing else adjusts linestocopy.
68 static int vp8_calc_partial_ssl_err(YV12_BUFFER_CONFIG *source, YV12_BUFFER_CONFIG *dest, int Fraction, const vp8_variance_rtcd_vtable_t *rtcd)
72 int srcoffset, dstoffset;
73 unsigned char *src = source->y_buffer;
74 unsigned char *dst = dest->y_buffer;
76 int linestocopy = (source->y_height >> (Fraction + 4));
// Byte offsets of row (dest->y_height / 32, rounded down) * 16 in each buffer.
// Both offsets use dest->y_height, each with its own stride.
// NOTE(review): no visible line adds srcoffset / dstoffset to src / dst (the
// embedded numbering skips 87-90) — confirm against the original file.
85 srcoffset = source->y_stride * (dest->y_height >> 5) * 16;
86 dstoffset = dest->y_stride * (dest->y_height >> 5) * 16;
91 // Loop through the Y plane raw and reconstruction data summing (square differences)
92 for (i = 0; i < linestocopy; i += 16)
94 for (j = 0; j < source->y_width; j += 16)
// The function's return value is accumulated; sse receives its output
// argument and is not read in the visible lines.
97 Total += VARIANCE_INVOKE(rtcd, mse16x16)(src + j, source->y_stride, dst + j, dest->y_stride, &sse);
// Advance both pointers to the next row of 16x16 blocks.
100 src += 16 * source->y_stride;
101 dst += 16 * dest->y_stride;
// Prototype of the partial-frame loop filter, defined outside this file.
// vp8cx_pick_filter_level_fast calls it as
// (cm, &cpi->mb.e_mbd, filter level, 0, 3).
// NOTE(review): only one line of the parameter list is visible in this
// listing; the remaining parameters and the closing ");" are missing.
107 extern void vp8_loop_filter_partial_frame
111 int default_filt_lvl,
116 // Enforce a minimum filter level based upon baseline Q
117 static int get_min_filter_level(VP8_COMP *cpi, int base_qindex)
119 int min_filter_level;
121 if (cpi->source_alt_ref_active && cpi->common.refresh_golden_frame && !cpi->common.refresh_alt_ref_frame)
122 min_filter_level = 0;
125 if (base_qindex <= 6)
126 min_filter_level = 0;
127 else if (base_qindex <= 16)
128 min_filter_level = 1;
130 min_filter_level = (base_qindex / 8);
133 return min_filter_level;
136 // Enforce a maximum filter level based upon baseline Q
137 static int get_max_filter_level(VP8_COMP *cpi, int base_qindex)
139 // PGW August 2006: Highest filter values almost always a bad idea
141 // jbb chg: 20100118 - not so any more with this overquant stuff allow high values
142 // with lots of intra coming in.
143 int max_filter_level = MAX_LOOP_FILTER ;//* 3 / 4;
146 if (cpi->twopass.section_intra_rating > 8)
147 max_filter_level = MAX_LOOP_FILTER * 3 / 4;
149 return max_filter_level;
// Picks cm->filter_level by a linear search outward from the previous frame's
// level, scoring each candidate on a partial band of the frame.
//
// sd:  source frame that each filtered reconstruction is scored against.
// cpi: encoder instance. cpi->common (cm) is updated in place, and
//      cpi->last_frame_uf receives the saved unfiltered band.
//
// Every partial copy / filter / error call here passes 3 as its Fraction
// argument. On return cm->filter_level has been clamped to
// [min_filter_level, max_filter_level].
//
// NOTE(review): this listing omits lines (the embedded numbering has gaps).
// The braces and the declarations of best_err, filt_err and filt_val are not
// visible, and neither are the `else` arms / loop exits that the comments
// below refer to. Confirm against the original file before relying on the
// control flow as printed.
152 void vp8cx_pick_filter_level_fast(YV12_BUFFER_CONFIG *sd, VP8_COMP *cpi)
154 VP8_COMMON *cm = &cpi->common;
158 int min_filter_level = get_min_filter_level(cpi, cm->base_qindex);
159 int max_filter_level = get_max_filter_level(cpi, cm->base_qindex);
161 int best_filt_val = cm->filter_level;
163 // Make a copy of the unfiltered / processed recon buffer
164 //vp8_yv12_copy_frame_ptr( cm->frame_to_show, &cpi->last_frame_uf );
165 vp8_yv12_copy_partial_frame_ptr(cm->frame_to_show, &cpi->last_frame_uf, 3);
// Key frames use sharpness 0.
// NOTE(review): the assignment from cpi->oxcf.Sharpness presumably sits under
// an `else` that is not visible in this listing.
167 if (cm->frame_type == KEY_FRAME)
168 cm->sharpness_level = 0;
170 cm->sharpness_level = cpi->oxcf.Sharpness;
172 // Start the search at the previous frame filter level unless it is now out of range.
173 if (cm->filter_level < min_filter_level)
174 cm->filter_level = min_filter_level;
175 else if (cm->filter_level > max_filter_level)
176 cm->filter_level = max_filter_level;
178 filt_val = cm->filter_level;
179 best_filt_val = filt_val;
181 // Set up alternate filter values
183 // Get the err using the previous frame's filter value.
184 vp8_loop_filter_partial_frame(cm, &cpi->mb.e_mbd, filt_val, 0 , 3);
// Record the frame type, filter type and sharpness in effect for the filter
// pass just run; the same three assignments follow every filter call below.
185 cm->last_frame_type = cm->frame_type;
186 cm->last_filter_type = cm->filter_type;
187 cm->last_sharpness_level = cm->sharpness_level;
189 best_err = vp8_calc_partial_ssl_err(sd, cm->frame_to_show, 3, IF_RTCD(&cpi->rtcd.variance));
191 // Re-instate the unfiltered frame
192 vp8_yv12_copy_partial_frame_ptr(&cpi->last_frame_uf, cm->frame_to_show, 3);
// Step down by 2 when the level is above 10, otherwise by 1.
194 filt_val -= (1 + ((filt_val > 10) ? 1 : 0));
196 // Search lower filter levels
197 while (filt_val >= min_filter_level)
199 // Apply the loop filter
200 vp8_loop_filter_partial_frame(cm, &cpi->mb.e_mbd, filt_val, 0, 3);
201 cm->last_frame_type = cm->frame_type;
202 cm->last_filter_type = cm->filter_type;
203 cm->last_sharpness_level = cm->sharpness_level;
205 // Get the err for filtered frame
206 filt_err = vp8_calc_partial_ssl_err(sd, cm->frame_to_show, 3, IF_RTCD(&cpi->rtcd.variance));
209 // Re-instate the unfiltered frame
210 vp8_yv12_copy_partial_frame_ptr(&cpi->last_frame_uf, cm->frame_to_show, 3);
213 // Update the best case record or exit loop.
// NOTE(review): neither an update of best_err nor the loop exit mentioned in
// the comment above is visible in this listing — confirm.
214 if (filt_err < best_err)
217 best_filt_val = filt_val;
222 // Adjust filter level
223 filt_val -= (1 + ((filt_val > 10) ? 1 : 0));
226 // Search up (note that we have already done filt_val = cm->filter_level)
// NOTE(review): the step size is chosen from filt_val as left by the downward
// search, not from cm->filter_level — confirm this is intended.
227 filt_val = cm->filter_level + (1 + ((filt_val > 10) ? 1 : 0));
// The upward search is guarded by this test, i.e. it is meant to run only
// when the downward search did not find a better level.
229 if (best_filt_val == cm->filter_level)
231 // Resist raising filter level for very small gains
232 best_err -= (best_err >> 10);
// The comparison is strict, so max_filter_level itself is never tried here.
234 while (filt_val < max_filter_level)
236 // Apply the loop filter
237 vp8_loop_filter_partial_frame(cm, &cpi->mb.e_mbd, filt_val, 0, 3);
238 cm->last_frame_type = cm->frame_type;
239 cm->last_filter_type = cm->filter_type;
240 cm->last_sharpness_level = cm->sharpness_level;
242 // Get the err for filtered frame
243 filt_err = vp8_calc_partial_ssl_err(sd, cm->frame_to_show, 3, IF_RTCD(&cpi->rtcd.variance));
245 // Re-instate the unfiltered frame
246 vp8_yv12_copy_partial_frame_ptr(&cpi->last_frame_uf, cm->frame_to_show, 3);
248 // Update the best case record or exit loop.
249 if (filt_err < best_err)
251 // Do not raise filter level if improvement is < 1 part in 4096
// NOTE(review): `>> 10` is 1 part in 1024, not the 4096 stated above.
252 best_err = filt_err - (filt_err >> 10);
254 best_filt_val = filt_val;
259 // Adjust filter level
260 filt_val += (1 + ((filt_val > 10) ? 1 : 0));
// Store the winner, then clamp it to the permitted range.
264 cm->filter_level = best_filt_val;
266 if (cm->filter_level < min_filter_level)
267 cm->filter_level = min_filter_level;
269 if (cm->filter_level > max_filter_level)
270 cm->filter_level = max_filter_level;
273 // Stub function for now Alt LF not used
274 void vp8cx_set_alt_lf_level(VP8_COMP *cpi, int filt_val)
276 MACROBLOCKD *mbd = &cpi->mb.e_mbd;
279 mbd->segment_feature_data[MB_LVL_ALT_LF][0] = cpi->segment_feature_data[MB_LVL_ALT_LF][0];
280 mbd->segment_feature_data[MB_LVL_ALT_LF][1] = cpi->segment_feature_data[MB_LVL_ALT_LF][1];
281 mbd->segment_feature_data[MB_LVL_ALT_LF][2] = cpi->segment_feature_data[MB_LVL_ALT_LF][2];
282 mbd->segment_feature_data[MB_LVL_ALT_LF][3] = cpi->segment_feature_data[MB_LVL_ALT_LF][3];
// Picks cm->filter_level with a step search centred on the previous frame's
// level. Each candidate is applied with the luma-only loop filter, scored
// with vp8_calc_ss_err, and then the unfiltered frame is restored.
//
// sd:  source frame that each filtered reconstruction is scored against.
// cpi: encoder instance. cpi->common (cm) is updated in place, and
//      cpi->last_frame_uf receives the saved unfiltered frame.
//
// NOTE(review): this listing omits lines (the embedded numbering has gaps).
// Not visible are the braces, the declarations of best_err, filt_err,
// filt_best, filt_low, filt_high and filter_step, several preprocessor lines
// (#else / #endif and any guard around the NEON calls), and the `else` arms
// and best_err updates. Confirm against the original file before relying on
// the control flow as printed.
285 void vp8cx_pick_filter_level(YV12_BUFFER_CONFIG *sd, VP8_COMP *cpi)
287 VP8_COMMON *cm = &cpi->common;
291 int min_filter_level = get_min_filter_level(cpi, cm->base_qindex);
292 int max_filter_level = get_max_filter_level(cpi, cm->base_qindex);
296 int filt_mid = cm->filter_level; // Start search at previous frame filter level
// -1 / +1 record which way the last move went; 0 means no move yet.
299 int filt_direction = 0;
301 int Bias = 0; // Bias against raising loop filter and in favour of lowering it
303 // Make a copy of the unfiltered / processed recon buffer
// With runtime CPU detection the NEON copy is selected by the HAS_NEON flag;
// the other visible path calls vp8_yv12_copy_frame_ptr.
// NOTE(review): the preprocessor structure is only partly visible here.
305 #if CONFIG_RUNTIME_CPU_DETECT
306 if (cm->rtcd.flags & HAS_NEON)
309 vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(cm->frame_to_show, &cpi->last_frame_uf);
311 #if CONFIG_RUNTIME_CPU_DETECT
315 #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT
// This save uses vp8_yv12_copy_frame_ptr, whereas the restores further down
// use vp8_yv12_copy_frame_yonly_ptr.
317 vp8_yv12_copy_frame_ptr(cm->frame_to_show, &cpi->last_frame_uf);
// Key frames use sharpness 0.
// NOTE(review): the assignment from cpi->oxcf.Sharpness presumably sits under
// an `else` that is not visible in this listing.
321 if (cm->frame_type == KEY_FRAME)
322 cm->sharpness_level = 0;
324 cm->sharpness_level = cpi->oxcf.Sharpness;
326 // Start the search at the previous frame filter level unless it is now out of range.
327 filt_mid = cm->filter_level;
329 if (filt_mid < min_filter_level)
330 filt_mid = min_filter_level;
331 else if (filt_mid > max_filter_level)
332 filt_mid = max_filter_level;
334 // Define the initial step size
// 4 for starting levels below 16, otherwise a quarter of the starting level.
335 filter_step = (filt_mid < 16) ? 4 : filt_mid / 4;
337 // Get baseline error score
338 vp8cx_set_alt_lf_level(cpi, filt_mid);
339 vp8_loop_filter_frame_yonly(cm, &cpi->mb.e_mbd, filt_mid, 0);
// Record the frame type, filter type and sharpness in effect for the filter
// pass just run; the same three assignments follow every filter call below.
340 cm->last_frame_type = cm->frame_type;
341 cm->last_filter_type = cm->filter_type;
342 cm->last_sharpness_level = cm->sharpness_level;
344 best_err = vp8_calc_ss_err(sd, cm->frame_to_show, IF_RTCD(&cpi->rtcd.variance));
345 filt_best = filt_mid;
347 // Re-instate the unfiltered frame
349 #if CONFIG_RUNTIME_CPU_DETECT
350 if (cm->rtcd.flags & HAS_NEON)
353 vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(&cpi->last_frame_uf, cm->frame_to_show);
355 #if CONFIG_RUNTIME_CPU_DETECT
359 #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT
361 vp8_yv12_copy_frame_yonly_ptr(&cpi->last_frame_uf, cm->frame_to_show);
// Iterate until the step has been halved down to zero.
365 while (filter_step > 0)
// The shift shrinks as filt_mid grows, so Bias is a larger share of best_err
// at higher filter levels; it also scales with the current step.
367 Bias = (best_err >> (15 - (filt_mid / 8))) * filter_step; //PGW change 12/12/06 for small images
369 // jbb chg: 20100118 - in sections with lots of new material coming in don't bias as much to a low filter value
// Below a rating of 20, Bias is scaled by rating / 20.
370 if (cpi->twopass.section_intra_rating < 20)
371 Bias = Bias * cpi->twopass.section_intra_rating / 20;
// Candidate levels one step either side of filt_mid, clamped to the range.
373 filt_high = ((filt_mid + filter_step) > max_filter_level) ? max_filter_level : (filt_mid + filter_step);
374 filt_low = ((filt_mid - filter_step) < min_filter_level) ? min_filter_level : (filt_mid - filter_step);
// Probe downward only if the last move was not upward and clamping left a
// level different from filt_mid.
376 if ((filt_direction <= 0) && (filt_low != filt_mid))
378 // Get Low filter error score
379 vp8cx_set_alt_lf_level(cpi, filt_low);
380 vp8_loop_filter_frame_yonly(cm, &cpi->mb.e_mbd, filt_low, 0);
381 cm->last_frame_type = cm->frame_type;
382 cm->last_filter_type = cm->filter_type;
383 cm->last_sharpness_level = cm->sharpness_level;
385 filt_err = vp8_calc_ss_err(sd, cm->frame_to_show, IF_RTCD(&cpi->rtcd.variance));
387 // Re-instate the unfiltered frame
389 #if CONFIG_RUNTIME_CPU_DETECT
390 if (cm->rtcd.flags & HAS_NEON)
393 vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(&cpi->last_frame_uf, cm->frame_to_show);
395 #if CONFIG_RUNTIME_CPU_DETECT
399 #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT
401 vp8_yv12_copy_frame_yonly_ptr(&cpi->last_frame_uf, cm->frame_to_show);
405 // If value is close to the best so far then bias towards a lower loop filter value.
406 if ((filt_err - Bias) < best_err)
408 // Was it actually better than the previous best?
// NOTE(review): the statement guarded by this inner test (presumably the
// best_err update) is not visible in this listing — confirm.
409 if (filt_err < best_err)
412 filt_best = filt_low;
416 // Now look at filt_high
// Probe upward only if the last move was not downward and clamping left a
// level different from filt_mid.
417 if ((filt_direction >= 0) && (filt_high != filt_mid))
419 vp8cx_set_alt_lf_level(cpi, filt_high);
420 vp8_loop_filter_frame_yonly(cm, &cpi->mb.e_mbd, filt_high, 0);
421 cm->last_frame_type = cm->frame_type;
422 cm->last_filter_type = cm->filter_type;
423 cm->last_sharpness_level = cm->sharpness_level;
425 filt_err = vp8_calc_ss_err(sd, cm->frame_to_show, IF_RTCD(&cpi->rtcd.variance));
427 // Re-instate the unfiltered frame
429 #if CONFIG_RUNTIME_CPU_DETECT
430 if (cm->rtcd.flags & HAS_NEON)
433 vp8_yv12_copy_frame_yonly_no_extend_frame_borders_neon(&cpi->last_frame_uf, cm->frame_to_show);
435 #if CONFIG_RUNTIME_CPU_DETECT
439 #if !HAVE_ARMV7 || CONFIG_RUNTIME_CPU_DETECT
441 vp8_yv12_copy_frame_yonly_ptr(&cpi->last_frame_uf, cm->frame_to_show);
445 // Was it better than the previous best?
// A higher level must beat the best error by more than Bias to be accepted.
// NOTE(review): no best_err update is visible under this test — confirm.
446 if (filt_err < (best_err - Bias))
449 filt_best = filt_high;
453 // Half the step distance if the best filter value was the same as last time
454 if (filt_best == filt_mid)
456 filter_step = filter_step / 2;
// NOTE(review): the next two lines presumably form the `else` arm of the test
// above: remember which way the search moved and re-centre on the new best.
461 filt_direction = (filt_best < filt_mid) ? -1 : 1;
462 filt_mid = filt_best;
// Publish the selected level.
466 cm->filter_level = filt_best;