1f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)/* 2f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) * Copyright (c) 2010 The WebM project authors. All Rights Reserved. 3f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) * 4f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) * Use of this source code is governed by a BSD-style license 5f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) * that can be found in the LICENSE file in the root of the source 6f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) * tree. An additional intellectual property rights grant can be found 7f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) * in the file PATENTS. All contributing project authors may 8f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) * be found in the AUTHORS file in the root of the source tree. 9f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) */ 10f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 11f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include <assert.h> 12f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include <limits.h> 13f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 14f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "./vpx_scale_rtcd.h" 15f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 16f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vpx_mem/vpx_mem.h" 17f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 18f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/common/vp9_loopfilter.h" 19f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/common/vp9_onyxc_int.h" 20f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/common/vp9_quant_common.h" 21f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 22f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/encoder/vp9_encoder.h" 23f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/encoder/vp9_picklpf.h" 24f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/encoder/vp9_quantize.h" 25f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 26f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)static int get_max_filter_level(const VP9_COMP *cpi) { 27f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) if (cpi->oxcf.pass == 2) { 28116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch return cpi->twopass.section_intra_rating > 8 ? MAX_LOOP_FILTER * 3 / 4 29116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch : MAX_LOOP_FILTER; 30116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch } else { 31116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch return MAX_LOOP_FILTER; 32f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) } 33116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch} 34116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch 35f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 36f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)static int try_filter_frame(const YV12_BUFFER_CONFIG *sd, VP9_COMP *const cpi, 37f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) int filt_level, int partial_frame) { 38f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) VP9_COMMON *const cm = &cpi->common; 39f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) int filt_err; 40f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 41a1401311d1ab56c4ed0a474bd38c108f75cb0cd9Torne (Richard Coles) vp9_loop_filter_frame(cm->frame_to_show, cm, &cpi->mb.e_mbd, filt_level, 1, 42010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles) partial_frame); 43010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles) filt_err = vp9_get_y_sse(sd, cm->frame_to_show); 441320f92c476a1ad9d19dba2a48c72b75566198e9Primiano Tucci 451320f92c476a1ad9d19dba2a48c72b75566198e9Primiano Tucci // Re-instate the unfiltered frame 46f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) vpx_yv12_copy_y(&cpi->last_frame_uf, cm->frame_to_show); 47010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles) 48f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) return filt_err; 49f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)} 50f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 515d1f7b1de12d16ceb2c938c56701a3e8bfa558f7Torne (Richard Coles)static int search_filter_level(const YV12_BUFFER_CONFIG *sd, VP9_COMP *cpi, 52116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch int partial_frame) { 53f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) const VP9_COMMON *const cm = &cpi->common; 54f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) const struct loopfilter *const lf = &cm->lf; 55010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles) const int min_filter_level = 0; 5646d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles) const int max_filter_level = get_max_filter_level(cpi); 57f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) int filt_direction = 0; 58116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch int best_err, filt_best; 59f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 60f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Start the search at the previous frame filter level unless it is now out of 61116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch // range. 6203b57e008b61dfcb1fbad3aea950ae0e001748b0Torne (Richard Coles) int filt_mid = clamp(lf->filter_level, min_filter_level, max_filter_level); 63116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch int filter_step = filt_mid < 16 ? 4 : filt_mid / 4; 645f1c94371a64b3196d4be9466099bb892df9b88eTorne (Richard Coles) // Sum squared error at each filter level 65f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) int ss_err[MAX_LOOP_FILTER + 1]; 66f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 67f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Set each entry to -1 68f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) vpx_memset(ss_err, 0xFF, sizeof(ss_err)); 69116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch 70116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch // Make a copy of the unfiltered / processed recon buffer 7146d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles) vpx_yv12_copy_y(cm->frame_to_show, &cpi->last_frame_uf); 7246d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles) 73f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) best_err = try_filter_frame(sd, cpi, filt_mid, partial_frame); 7446d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles) filt_best = filt_mid; 75010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles) ss_err[filt_mid] = best_err; 76f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 77f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) while (filter_step > 0) { 78f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) const int filt_high = MIN(filt_mid + filter_step, max_filter_level); 79f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) const int filt_low = MAX(filt_mid - filter_step, min_filter_level); 80f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) 81f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) // Bias against raising loop filter in favor of lowering it. 82f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles) int bias = (best_err >> (15 - (filt_mid / 8))) * filter_step; 83 84 if ((cpi->oxcf.pass == 2) && (cpi->twopass.section_intra_rating < 20)) 85 bias = (bias * cpi->twopass.section_intra_rating) / 20; 86 87 // yx, bias less for large block size 88 if (cm->tx_mode != ONLY_4X4) 89 bias >>= 1; 90 91 if (filt_direction <= 0 && filt_low != filt_mid) { 92 // Get Low filter error score 93 if (ss_err[filt_low] < 0) { 94 ss_err[filt_low] = try_filter_frame(sd, cpi, filt_low, partial_frame); 95 } 96 // If value is close to the best so far then bias towards a lower loop 97 // filter value. 98 if ((ss_err[filt_low] - bias) < best_err) { 99 // Was it actually better than the previous best? 100 if (ss_err[filt_low] < best_err) 101 best_err = ss_err[filt_low]; 102 103 filt_best = filt_low; 104 } 105 } 106 107 // Now look at filt_high 108 if (filt_direction >= 0 && filt_high != filt_mid) { 109 if (ss_err[filt_high] < 0) { 110 ss_err[filt_high] = try_filter_frame(sd, cpi, filt_high, partial_frame); 111 } 112 // Was it better than the previous best? 113 if (ss_err[filt_high] < (best_err - bias)) { 114 best_err = ss_err[filt_high]; 115 filt_best = filt_high; 116 } 117 } 118 119 // Half the step distance if the best filter value was the same as last time 120 if (filt_best == filt_mid) { 121 filter_step /= 2; 122 filt_direction = 0; 123 } else { 124 filt_direction = (filt_best < filt_mid) ? -1 : 1; 125 filt_mid = filt_best; 126 } 127 } 128 129 return filt_best; 130} 131 132void vp9_pick_filter_level(const YV12_BUFFER_CONFIG *sd, VP9_COMP *cpi, 133 LPF_PICK_METHOD method) { 134 VP9_COMMON *const cm = &cpi->common; 135 struct loopfilter *const lf = &cm->lf; 136 137 lf->sharpness_level = cm->frame_type == KEY_FRAME ? 0 138 : cpi->oxcf.sharpness; 139 140 if (method == LPF_PICK_MINIMAL_LPF && lf->filter_level) { 141 lf->filter_level = 0; 142 } else if (method >= LPF_PICK_FROM_Q) { 143 const int min_filter_level = 0; 144 const int max_filter_level = get_max_filter_level(cpi); 145 const int q = vp9_ac_quant(cm->base_qindex, 0, cm->bit_depth); 146 // These values were determined by linear fitting the result of the 147 // searched level, filt_guess = q * 0.316206 + 3.87252 148 int filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 1015158, 18); 149 if (cm->frame_type == KEY_FRAME) 150 filt_guess -= 4; 151 lf->filter_level = clamp(filt_guess, min_filter_level, max_filter_level); 152 } else { 153 lf->filter_level = search_filter_level(sd, cpi, 154 method == LPF_PICK_FROM_SUBIMAGE); 155 } 156} 157