Merge "Use bigdia search with pruned subpel search"
[platform/upstream/libvpx.git] / vp9 / encoder / vp9_speed_features.c
1 /*
2  *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
3  *
4  *  Use of this source code is governed by a BSD-style license
5  *  that can be found in the LICENSE file in the root of the source
6  *  tree. An additional intellectual property rights grant can be found
7  *  in the file PATENTS.  All contributing project authors may
8  *  be found in the AUTHORS file in the root of the source tree.
9  */
10
11 #include <limits.h>
12
13 #include "vp9/encoder/vp9_encoder.h"
14 #include "vp9/encoder/vp9_speed_features.h"
15
16 // Intra only frames, golden frames (except alt ref overlays) and
17 // alt ref frames tend to be coded at a higher than ambient quality
18 static int frame_is_boosted(const VP9_COMP *cpi) {
19   return frame_is_intra_only(&cpi->common) ||
20          cpi->refresh_alt_ref_frame ||
21          (cpi->refresh_golden_frame && !cpi->rc.is_src_frame_alt_ref) ||
22          vp9_is_upper_layer_key_frame(cpi);
23 }
24
25
26 static void set_good_speed_feature(VP9_COMP *cpi, VP9_COMMON *cm,
27                                    SPEED_FEATURES *sf, int speed) {
28   const int boosted = frame_is_boosted(cpi);
29
30   sf->adaptive_rd_thresh = 1;
31   sf->allow_skip_recode = 1;
32
33   if (speed >= 1) {
34     sf->use_square_partition_only = !frame_is_intra_only(cm);
35     sf->less_rectangular_check  = 1;
36
37     if (MIN(cm->width, cm->height) >= 720)
38       sf->disable_split_mask = cm->show_frame ? DISABLE_ALL_SPLIT
39                                               : DISABLE_ALL_INTER_SPLIT;
40     else
41       sf->disable_split_mask = DISABLE_COMPOUND_SPLIT;
42     sf->use_rd_breakout = 1;
43     sf->adaptive_motion_search = 1;
44     sf->mv.auto_mv_step_size = 1;
45     sf->adaptive_rd_thresh = 2;
46     sf->mv.subpel_iters_per_step = 1;
47     sf->mode_skip_start = 10;
48     sf->adaptive_pred_interp_filter = 1;
49
50     sf->recode_loop = ALLOW_RECODE_KFARFGF;
51     sf->intra_y_mode_mask[TX_32X32] = INTRA_DC_H_V;
52     sf->intra_uv_mode_mask[TX_32X32] = INTRA_DC_H_V;
53     sf->intra_y_mode_mask[TX_16X16] = INTRA_DC_H_V;
54     sf->intra_uv_mode_mask[TX_16X16] = INTRA_DC_H_V;
55
56     sf->tx_size_search_breakout = 1;
57
58     if (MIN(cm->width, cm->height) >= 720)
59       sf->partition_search_breakout_dist_thr = (1 << 23);
60     else
61       sf->partition_search_breakout_dist_thr = (1 << 21);
62     sf->partition_search_breakout_rate_thr = 500;
63   }
64
65   if (speed >= 2) {
66     sf->tx_size_search_method = frame_is_boosted(cpi) ? USE_FULL_RD
67                                                       : USE_LARGESTALL;
68
69     if (MIN(cm->width, cm->height) >= 720) {
70       sf->disable_split_mask = cm->show_frame ? DISABLE_ALL_SPLIT
71                                               : DISABLE_ALL_INTER_SPLIT;
72       sf->adaptive_pred_interp_filter = 0;
73     } else {
74       sf->disable_split_mask = LAST_AND_INTRA_SPLIT_ONLY;
75     }
76
77     sf->reference_masking = 1;
78     sf->mode_search_skip_flags = FLAG_SKIP_INTRA_DIRMISMATCH |
79                                  FLAG_SKIP_INTRA_BESTINTER |
80                                  FLAG_SKIP_COMP_BESTINTRA |
81                                  FLAG_SKIP_INTRA_LOWVAR;
82     sf->disable_filter_search_var_thresh = 100;
83     sf->comp_inter_joint_search_thresh = BLOCK_SIZES;
84     sf->auto_min_max_partition_size = CONSTRAIN_NEIGHBORING_MIN_MAX;
85
86     if (MIN(cm->width, cm->height) >= 720)
87       sf->partition_search_breakout_dist_thr = (1 << 24);
88     else
89       sf->partition_search_breakout_dist_thr = (1 << 22);
90     sf->partition_search_breakout_rate_thr = 700;
91   }
92
93   if (speed >= 3) {
94     sf->tx_size_search_method = frame_is_intra_only(cm) ? USE_FULL_RD
95                                                         : USE_LARGESTALL;
96     if (MIN(cm->width, cm->height) >= 720) {
97       sf->disable_split_mask = DISABLE_ALL_SPLIT;
98     } else {
99       sf->max_intra_bsize = BLOCK_32X32;
100       sf->disable_split_mask = DISABLE_ALL_INTER_SPLIT;
101     }
102     sf->adaptive_pred_interp_filter = 0;
103     sf->adaptive_mode_search = 1;
104     sf->cb_partition_search = !boosted;
105     sf->cb_pred_filter_search = 1;
106     sf->alt_ref_search_fp = 1;
107     sf->motion_field_mode_search = !boosted;
108     sf->recode_loop = ALLOW_RECODE_KFMAXBW;
109     sf->adaptive_rd_thresh = 3;
110     sf->mode_skip_start = 6;
111     sf->intra_y_mode_mask[TX_32X32] = INTRA_DC;
112     sf->intra_uv_mode_mask[TX_32X32] = INTRA_DC;
113     sf->adaptive_interp_filter_search = 1;
114
115     if (MIN(cm->width, cm->height) >= 720)
116       sf->partition_search_breakout_dist_thr = (1 << 25);
117     else
118       sf->partition_search_breakout_dist_thr = (1 << 23);
119     sf->partition_search_breakout_rate_thr = 1000;
120   }
121
122   if (speed >= 4) {
123     sf->use_square_partition_only = 1;
124     sf->tx_size_search_method = USE_LARGESTALL;
125     sf->disable_split_mask = DISABLE_ALL_SPLIT;
126     sf->mv.search_method = BIGDIA;
127     sf->mv.subpel_search_method = SUBPEL_TREE_PRUNED;
128     sf->adaptive_rd_thresh = 4;
129     sf->mode_search_skip_flags |= FLAG_SKIP_COMP_REFMISMATCH |
130                                   FLAG_EARLY_TERMINATE;
131     sf->disable_filter_search_var_thresh = 200;
132     sf->use_lp32x32fdct = 1;
133     sf->use_fast_coef_updates = ONE_LOOP_REDUCED;
134     sf->use_fast_coef_costing = 1;
135
136     if (MIN(cm->width, cm->height) >= 720)
137       sf->partition_search_breakout_dist_thr = (1 << 26);
138     else
139       sf->partition_search_breakout_dist_thr = (1 << 24);
140     sf->partition_search_breakout_rate_thr = 1500;
141   }
142
143   if (speed >= 5) {
144     int i;
145
146     sf->partition_search_type = FIXED_PARTITION;
147     sf->optimize_coefficients = 0;
148     sf->mv.search_method = HEX;
149     sf->disable_filter_search_var_thresh = 500;
150     for (i = 0; i < TX_SIZES; ++i) {
151       sf->intra_y_mode_mask[i] = INTRA_DC;
152       sf->intra_uv_mode_mask[i] = INTRA_DC;
153     }
154     cpi->allow_encode_breakout = ENCODE_BREAKOUT_ENABLED;
155   }
156   if (speed >= 6) {
157     sf->mv.reduce_first_step_size = 1;
158   }
159 }
160
161 static void set_rt_speed_feature(VP9_COMP *cpi, SPEED_FEATURES *sf,
162                                  int speed, vp9e_tune_content content) {
163   VP9_COMMON *const cm = &cpi->common;
164   const int is_keyframe = cm->frame_type == KEY_FRAME;
165   const int frames_since_key = is_keyframe ? 0 : cpi->rc.frames_since_key;
166   sf->static_segmentation = 0;
167   sf->adaptive_rd_thresh = 1;
168   sf->use_fast_coef_costing = 1;
169
170   if (speed >= 1) {
171     sf->use_square_partition_only = !frame_is_intra_only(cm);
172     sf->less_rectangular_check = 1;
173     sf->tx_size_search_method = frame_is_intra_only(cm) ? USE_FULL_RD
174                                                         : USE_LARGESTALL;
175
176     if (MIN(cm->width, cm->height) >= 720)
177       sf->disable_split_mask = cm->show_frame ? DISABLE_ALL_SPLIT
178                                               : DISABLE_ALL_INTER_SPLIT;
179     else
180       sf->disable_split_mask = DISABLE_COMPOUND_SPLIT;
181
182     sf->use_rd_breakout = 1;
183
184     sf->adaptive_motion_search = 1;
185     sf->adaptive_pred_interp_filter = 1;
186     sf->mv.auto_mv_step_size = 1;
187     sf->adaptive_rd_thresh = 2;
188     sf->intra_y_mode_mask[TX_32X32] = INTRA_DC_H_V;
189     sf->intra_uv_mode_mask[TX_32X32] = INTRA_DC_H_V;
190     sf->intra_uv_mode_mask[TX_16X16] = INTRA_DC_H_V;
191   }
192
193   if (speed >= 2) {
194     if (MIN(cm->width, cm->height) >= 720)
195       sf->disable_split_mask = cm->show_frame ? DISABLE_ALL_SPLIT
196                                               : DISABLE_ALL_INTER_SPLIT;
197     else
198       sf->disable_split_mask = LAST_AND_INTRA_SPLIT_ONLY;
199
200     sf->mode_search_skip_flags = FLAG_SKIP_INTRA_DIRMISMATCH |
201                                  FLAG_SKIP_INTRA_BESTINTER |
202                                  FLAG_SKIP_COMP_BESTINTRA |
203                                  FLAG_SKIP_INTRA_LOWVAR;
204     sf->adaptive_pred_interp_filter = 2;
205     sf->reference_masking = 1;
206     sf->disable_filter_search_var_thresh = 50;
207     sf->comp_inter_joint_search_thresh = BLOCK_SIZES;
208     sf->auto_min_max_partition_size = RELAXED_NEIGHBORING_MIN_MAX;
209     sf->use_lastframe_partitioning = LAST_FRAME_PARTITION_LOW_MOTION;
210     sf->lf_motion_threshold = LOW_MOTION_THRESHOLD;
211     sf->adjust_partitioning_from_last_frame = 1;
212     sf->last_partitioning_redo_frequency = 3;
213     sf->use_lp32x32fdct = 1;
214     sf->mode_skip_start = 11;
215     sf->intra_y_mode_mask[TX_16X16] = INTRA_DC_H_V;
216   }
217
218   if (speed >= 3) {
219     sf->use_square_partition_only = 1;
220     sf->disable_filter_search_var_thresh = 100;
221     sf->use_lastframe_partitioning = LAST_FRAME_PARTITION_ALL;
222     sf->constrain_copy_partition = 1;
223     sf->use_uv_intra_rd_estimate = 1;
224     sf->skip_encode_sb = 1;
225     sf->mv.subpel_iters_per_step = 1;
226     sf->use_fast_coef_updates = ONE_LOOP_REDUCED;
227     sf->adaptive_rd_thresh = 4;
228     sf->mode_skip_start = 6;
229     sf->allow_skip_recode = 0;
230     sf->optimize_coefficients = 0;
231     sf->disable_split_mask = DISABLE_ALL_SPLIT;
232     sf->lpf_pick = LPF_PICK_FROM_Q;
233   }
234
235   if (speed >= 4) {
236     int i;
237     sf->last_partitioning_redo_frequency = 4;
238     sf->adaptive_rd_thresh = 5;
239     sf->use_fast_coef_costing = 0;
240     sf->auto_min_max_partition_size = STRICT_NEIGHBORING_MIN_MAX;
241     sf->adjust_partitioning_from_last_frame =
242         cm->last_frame_type != cm->frame_type || (0 ==
243         (frames_since_key + 1) % sf->last_partitioning_redo_frequency);
244     sf->mv.subpel_force_stop = 1;
245     for (i = 0; i < TX_SIZES; i++) {
246       sf->intra_y_mode_mask[i] = INTRA_DC_H_V;
247       sf->intra_uv_mode_mask[i] = INTRA_DC;
248     }
249     sf->intra_y_mode_mask[TX_32X32] = INTRA_DC;
250     sf->frame_parameter_update = 0;
251     sf->mv.search_method = FAST_HEX;
252     sf->inter_mode_mask[BLOCK_32X32] = INTER_NEAREST_NEAR_NEW;
253     sf->inter_mode_mask[BLOCK_32X64] = INTER_NEAREST;
254     sf->inter_mode_mask[BLOCK_64X32] = INTER_NEAREST;
255     sf->inter_mode_mask[BLOCK_64X64] = INTER_NEAREST;
256     sf->max_intra_bsize = BLOCK_32X32;
257     sf->allow_skip_recode = 1;
258   }
259
260   if (speed >= 5) {
261     sf->use_quant_fp = !is_keyframe;
262     sf->auto_min_max_partition_size = is_keyframe ? RELAXED_NEIGHBORING_MIN_MAX
263                                                   : STRICT_NEIGHBORING_MIN_MAX;
264     sf->max_partition_size = BLOCK_32X32;
265     sf->min_partition_size = BLOCK_8X8;
266     sf->partition_check =
267         (frames_since_key % sf->last_partitioning_redo_frequency == 1);
268     sf->force_frame_boost = is_keyframe ||
269         (frames_since_key % (sf->last_partitioning_redo_frequency << 1) == 1);
270     sf->max_delta_qindex = is_keyframe ? 20 : 15;
271     sf->partition_search_type = REFERENCE_PARTITION;
272     sf->use_nonrd_pick_mode = 1;
273     sf->allow_skip_recode = 0;
274   }
275
276   if (speed >= 6) {
277     if (content == VP9E_CONTENT_SCREEN) {
278       int i;
279       // Allow fancy modes at all sizes since SOURCE_VAR_BASED_PARTITION is used
280       for (i = 0; i < BLOCK_SIZES; ++i)
281         sf->inter_mode_mask[i] = INTER_ALL;
282     }
283
284     // Adaptively switch between SOURCE_VAR_BASED_PARTITION and FIXED_PARTITION.
285     sf->partition_search_type = SOURCE_VAR_BASED_PARTITION;
286     sf->search_type_check_frequency = 50;
287
288     sf->tx_size_search_method = is_keyframe ? USE_LARGESTALL : USE_TX_8X8;
289
290     // This feature is only enabled when partition search is disabled.
291     sf->reuse_inter_pred_sby = 1;
292
293     // Increase mode checking threshold for NEWMV.
294     sf->elevate_newmv_thresh = 2000;
295
296     sf->mv.reduce_first_step_size = 1;
297   }
298
299   if (speed >= 7) {
300     sf->mv.search_method = FAST_DIAMOND;
301     sf->mv.fullpel_search_step_param = 10;
302     sf->lpf_pick = LPF_PICK_MINIMAL_LPF;
303     sf->encode_breakout_thresh = (MIN(cm->width, cm->height) >= 720) ?
304         800 : 300;
305     sf->elevate_newmv_thresh = 2500;
306   }
307
308   if (speed >= 12) {
309     sf->elevate_newmv_thresh = 4000;
310     sf->mv.subpel_force_stop = 2;
311   }
312
313   if (speed >= 13) {
314     int i;
315     sf->max_intra_bsize = BLOCK_32X32;
316     for (i = 0; i < BLOCK_SIZES; ++i)
317       sf->inter_mode_mask[i] = INTER_NEAREST;
318   }
319 }
320
321 void vp9_set_speed_features(VP9_COMP *cpi) {
322   SPEED_FEATURES *const sf = &cpi->sf;
323   VP9_COMMON *const cm = &cpi->common;
324   const VP9EncoderConfig *const oxcf = &cpi->oxcf;
325   int i;
326
327   // best quality defaults
328   sf->frame_parameter_update = 1;
329   sf->mv.search_method = NSTEP;
330   sf->recode_loop = ALLOW_RECODE;
331   sf->mv.subpel_search_method = SUBPEL_TREE;
332   sf->mv.subpel_iters_per_step = 2;
333   sf->mv.subpel_force_stop = 0;
334   sf->optimize_coefficients = !is_lossless_requested(&cpi->oxcf);
335   sf->mv.reduce_first_step_size = 0;
336   sf->mv.auto_mv_step_size = 0;
337   sf->mv.fullpel_search_step_param = 6;
338   sf->comp_inter_joint_search_thresh = BLOCK_4X4;
339   sf->adaptive_rd_thresh = 0;
340   sf->use_lastframe_partitioning = LAST_FRAME_PARTITION_OFF;
341   sf->tx_size_search_method = USE_FULL_RD;
342   sf->use_lp32x32fdct = 0;
343   sf->adaptive_motion_search = 0;
344   sf->adaptive_pred_interp_filter = 0;
345   sf->adaptive_mode_search = 0;
346   sf->cb_pred_filter_search = 0;
347   sf->cb_partition_search = 0;
348   sf->motion_field_mode_search = 0;
349   sf->alt_ref_search_fp = 0;
350   sf->use_quant_fp = 0;
351   sf->reference_masking = 0;
352   sf->partition_search_type = SEARCH_PARTITION;
353   sf->less_rectangular_check = 0;
354   sf->use_square_partition_only = 0;
355   sf->auto_min_max_partition_size = NOT_IN_USE;
356   sf->max_partition_size = BLOCK_64X64;
357   sf->min_partition_size = BLOCK_4X4;
358   sf->adjust_partitioning_from_last_frame = 0;
359   sf->last_partitioning_redo_frequency = 4;
360   sf->constrain_copy_partition = 0;
361   sf->disable_split_mask = 0;
362   sf->mode_search_skip_flags = 0;
363   sf->force_frame_boost = 0;
364   sf->max_delta_qindex = 0;
365   sf->disable_filter_search_var_thresh = 0;
366   sf->adaptive_interp_filter_search = 0;
367
368   for (i = 0; i < TX_SIZES; i++) {
369     sf->intra_y_mode_mask[i] = INTRA_ALL;
370     sf->intra_uv_mode_mask[i] = INTRA_ALL;
371   }
372   sf->use_rd_breakout = 0;
373   sf->skip_encode_sb = 0;
374   sf->use_uv_intra_rd_estimate = 0;
375   sf->allow_skip_recode = 0;
376   sf->lpf_pick = LPF_PICK_FROM_FULL_IMAGE;
377   sf->use_fast_coef_updates = TWO_LOOP;
378   sf->use_fast_coef_costing = 0;
379   sf->mode_skip_start = MAX_MODES;  // Mode index at which mode skip mask set
380   sf->use_nonrd_pick_mode = 0;
381   for (i = 0; i < BLOCK_SIZES; ++i)
382     sf->inter_mode_mask[i] = INTER_ALL;
383   sf->max_intra_bsize = BLOCK_64X64;
384   sf->reuse_inter_pred_sby = 0;
385   // This setting only takes effect when partition_search_type is set
386   // to FIXED_PARTITION.
387   sf->always_this_block_size = BLOCK_16X16;
388   sf->search_type_check_frequency = 50;
389   sf->encode_breakout_thresh = 0;
390   sf->elevate_newmv_thresh = 0;
391   // Recode loop tolerence %.
392   sf->recode_tolerance = 25;
393   sf->default_interp_filter = SWITCHABLE;
394   sf->tx_size_search_breakout = 0;
395   sf->partition_search_breakout_dist_thr = 0;
396   sf->partition_search_breakout_rate_thr = 0;
397
398   if (oxcf->mode == REALTIME)
399     set_rt_speed_feature(cpi, sf, oxcf->speed, oxcf->content);
400   else if (oxcf->mode == GOOD)
401     set_good_speed_feature(cpi, cm, sf, oxcf->speed);
402
403   cpi->full_search_sad = vp9_full_search_sad;
404   cpi->diamond_search_sad = oxcf->mode == BEST ? vp9_full_range_search
405                                                : vp9_diamond_search_sad;
406   cpi->refining_search_sad = vp9_refining_search_sad;
407
408
409   // Slow quant, dct and trellis not worthwhile for first pass
410   // so make sure they are always turned off.
411   if (oxcf->pass == 1)
412     sf->optimize_coefficients = 0;
413
414   // No recode for 1 pass.
415   if (oxcf->pass == 0) {
416     sf->recode_loop = DISALLOW_RECODE;
417     sf->optimize_coefficients = 0;
418   }
419
420   if (sf->mv.subpel_search_method == SUBPEL_TREE) {
421     cpi->find_fractional_mv_step = vp9_find_best_sub_pixel_tree;
422   } else if (sf->mv.subpel_search_method == SUBPEL_TREE_PRUNED) {
423     cpi->find_fractional_mv_step = vp9_find_best_sub_pixel_tree_pruned;
424   }
425
426   cpi->mb.optimize = sf->optimize_coefficients == 1 && oxcf->pass != 1;
427
428   if (sf->disable_split_mask == DISABLE_ALL_SPLIT)
429     sf->adaptive_pred_interp_filter = 0;
430
431   if (!cpi->oxcf.frame_periodic_boost) {
432     sf->max_delta_qindex = 0;
433   }
434
435   if (cpi->encode_breakout && oxcf->mode == REALTIME &&
436       sf->encode_breakout_thresh > cpi->encode_breakout)
437     cpi->encode_breakout = sf->encode_breakout_thresh;
438 }