/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
11f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include <assert.h>
12f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include <limits.h>
13f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
14f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "./vpx_scale_rtcd.h"
15f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
16f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vpx_mem/vpx_mem.h"
17f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
18f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/common/vp9_loopfilter.h"
19f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/common/vp9_onyxc_int.h"
20f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/common/vp9_quant_common.h"
21f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
22f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/encoder/vp9_encoder.h"
23f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/encoder/vp9_picklpf.h"
24f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)#include "vp9/encoder/vp9_quantize.h"
25f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
26f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)static int get_max_filter_level(const VP9_COMP *cpi) {
27f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  if (cpi->oxcf.pass == 2) {
28116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch    return cpi->twopass.section_intra_rating > 8 ? MAX_LOOP_FILTER * 3 / 4
29116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch                                                 : MAX_LOOP_FILTER;
30116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch  } else {
31116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch    return MAX_LOOP_FILTER;
32f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  }
33116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch}
34116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch
35f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
36f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)static int try_filter_frame(const YV12_BUFFER_CONFIG *sd, VP9_COMP *const cpi,
37f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)                            int filt_level, int partial_frame) {
38f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  VP9_COMMON *const cm = &cpi->common;
39f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  int filt_err;
40f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
41a1401311d1ab56c4ed0a474bd38c108f75cb0cd9Torne (Richard Coles)  vp9_loop_filter_frame(cm->frame_to_show, cm, &cpi->mb.e_mbd, filt_level, 1,
42010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles)                        partial_frame);
43010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles)  filt_err = vp9_get_y_sse(sd, cm->frame_to_show);
441320f92c476a1ad9d19dba2a48c72b75566198e9Primiano Tucci
451320f92c476a1ad9d19dba2a48c72b75566198e9Primiano Tucci  // Re-instate the unfiltered frame
46f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  vpx_yv12_copy_y(&cpi->last_frame_uf, cm->frame_to_show);
47010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles)
48f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  return filt_err;
49f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)}
50f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
515d1f7b1de12d16ceb2c938c56701a3e8bfa558f7Torne (Richard Coles)static int search_filter_level(const YV12_BUFFER_CONFIG *sd, VP9_COMP *cpi,
52116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch                               int partial_frame) {
53f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  const VP9_COMMON *const cm = &cpi->common;
54f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  const struct loopfilter *const lf = &cm->lf;
55010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles)  const int min_filter_level = 0;
5646d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles)  const int max_filter_level = get_max_filter_level(cpi);
57f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  int filt_direction = 0;
58116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch  int best_err, filt_best;
59f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
60f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // Start the search at the previous frame filter level unless it is now out of
61116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch  // range.
6203b57e008b61dfcb1fbad3aea950ae0e001748b0Torne (Richard Coles)  int filt_mid = clamp(lf->filter_level, min_filter_level, max_filter_level);
63116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch  int filter_step = filt_mid < 16 ? 4 : filt_mid / 4;
645f1c94371a64b3196d4be9466099bb892df9b88eTorne (Richard Coles)  // Sum squared error at each filter level
65f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  int ss_err[MAX_LOOP_FILTER + 1];
66f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
67f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  // Set each entry to -1
68f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  vpx_memset(ss_err, 0xFF, sizeof(ss_err));
69116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch
70116680a4aac90f2aa7413d9095a592090648e557Ben Murdoch  //  Make a copy of the unfiltered / processed recon buffer
7146d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles)  vpx_yv12_copy_y(cm->frame_to_show, &cpi->last_frame_uf);
7246d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles)
73f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  best_err = try_filter_frame(sd, cpi, filt_mid, partial_frame);
7446d4c2bc3267f3f028f39e7e311b0f89aba2e4fdTorne (Richard Coles)  filt_best = filt_mid;
75010d83a9304c5a91596085d917d248abff47903aTorne (Richard Coles)  ss_err[filt_mid] = best_err;
76f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
77f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)  while (filter_step > 0) {
78f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    const int filt_high = MIN(filt_mid + filter_step, max_filter_level);
79f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    const int filt_low = MAX(filt_mid - filter_step, min_filter_level);
80f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)
81f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    // Bias against raising loop filter in favor of lowering it.
82f2477e01787aa58f445919b809d89e252beef54fTorne (Richard Coles)    int bias = (best_err >> (15 - (filt_mid / 8))) * filter_step;
83
84    if ((cpi->oxcf.pass == 2) && (cpi->twopass.section_intra_rating < 20))
85      bias = (bias * cpi->twopass.section_intra_rating) / 20;
86
87    // yx, bias less for large block size
88    if (cm->tx_mode != ONLY_4X4)
89      bias >>= 1;
90
91    if (filt_direction <= 0 && filt_low != filt_mid) {
92      // Get Low filter error score
93      if (ss_err[filt_low] < 0) {
94        ss_err[filt_low] = try_filter_frame(sd, cpi, filt_low, partial_frame);
95      }
96      // If value is close to the best so far then bias towards a lower loop
97      // filter value.
98      if ((ss_err[filt_low] - bias) < best_err) {
99        // Was it actually better than the previous best?
100        if (ss_err[filt_low] < best_err)
101          best_err = ss_err[filt_low];
102
103        filt_best = filt_low;
104      }
105    }
106
107    // Now look at filt_high
108    if (filt_direction >= 0 && filt_high != filt_mid) {
109      if (ss_err[filt_high] < 0) {
110        ss_err[filt_high] = try_filter_frame(sd, cpi, filt_high, partial_frame);
111      }
112      // Was it better than the previous best?
113      if (ss_err[filt_high] < (best_err - bias)) {
114        best_err = ss_err[filt_high];
115        filt_best = filt_high;
116      }
117    }
118
119    // Half the step distance if the best filter value was the same as last time
120    if (filt_best == filt_mid) {
121      filter_step /= 2;
122      filt_direction = 0;
123    } else {
124      filt_direction = (filt_best < filt_mid) ? -1 : 1;
125      filt_mid = filt_best;
126    }
127  }
128
129  return filt_best;
130}
131
132void vp9_pick_filter_level(const YV12_BUFFER_CONFIG *sd, VP9_COMP *cpi,
133                           LPF_PICK_METHOD method) {
134  VP9_COMMON *const cm = &cpi->common;
135  struct loopfilter *const lf = &cm->lf;
136
137  lf->sharpness_level = cm->frame_type == KEY_FRAME ? 0
138                                                    : cpi->oxcf.sharpness;
139
140  if (method == LPF_PICK_MINIMAL_LPF && lf->filter_level) {
141      lf->filter_level = 0;
142  } else if (method >= LPF_PICK_FROM_Q) {
143    const int min_filter_level = 0;
144    const int max_filter_level = get_max_filter_level(cpi);
145    const int q = vp9_ac_quant(cm->base_qindex, 0, cm->bit_depth);
146    // These values were determined by linear fitting the result of the
147    // searched level, filt_guess = q * 0.316206 + 3.87252
148    int filt_guess = ROUND_POWER_OF_TWO(q * 20723 + 1015158, 18);
149    if (cm->frame_type == KEY_FRAME)
150      filt_guess -= 4;
151    lf->filter_level = clamp(filt_guess, min_filter_level, max_filter_level);
152  } else {
153    lf->filter_level = search_filter_level(sd, cpi,
154                                           method == LPF_PICK_FROM_SUBIMAGE);
155  }
156}
157