dct32x32_test.cc revision ba164dffc5a6795bce97fae02b51ccf3330e15e4
/*
 *  Copyright (c) 2012 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
10ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
11ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include <math.h>
12ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include <stdlib.h>
13ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include <string.h>
14ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
15ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "third_party/googletest/src/include/gtest/gtest.h"
16ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
17ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangextern "C" {
18ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "vp9/common/vp9_entropy.h"
19ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "./vp9_rtcd.h"
20ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  void vp9_short_fdct32x32_c(int16_t *input, int16_t *out, int pitch);
21ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  void vp9_short_idct32x32_add_c(short *input, uint8_t *output, int pitch);
22ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang}
23ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
24ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "test/acm_random.h"
25ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "vpx/vpx_integer.h"
26ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
27ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangusing libvpx_test::ACMRandom;
28ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
29ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangnamespace {
#ifdef _MSC_VER
// Rounds |x| to the nearest integer, with halfway cases going away from zero
// (0.5 -> 1, -0.5 -> -1), and returns the result as an int.
// Only compiled when _MSC_VER is defined -- presumably because that
// toolchain's <math.h> did not supply round(); TODO confirm.
static int round(double x) {
  const double nearest = (x < 0) ? ceil(x - 0.5) : floor(x + 0.5);
  return static_cast<int>(nearest);
}
#endif
38ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
static const double kPi = 3.141592653589793238462643383279502884;

// Floating-point reference for a 2-D 32x32 inverse DCT.
//
// |input| is read as 1024 coefficients at input[i * 32 + j]; |output|
// receives 1024 values at output[k * 32 + l]. Each output value is the sum,
// over every coefficient, of the coefficient times two cosine basis terms,
// divided by 1024, with an extra sqrt(2) factor for each non-zero frequency
// index. The accumulated sum is finally divided by 4.
static void reference2_32x32_idct_2d(double *input, double *output) {
  const double kSqrt2 = sqrt(2.0);
  for (int col = 0; col < 32; ++col) {
    for (int row = 0; row < 32; ++row) {
      double sum = 0;
      for (int u = 0; u < 32; ++u) {
        for (int v = 0; v < 32; ++v) {
          double term = cos(kPi * v * (col + 0.5) / 32.0) *
                        cos(kPi * u * (row + 0.5) / 32.0) *
                        input[u * 32 + v] / 1024;
          // Every basis function except the DC one carries a sqrt(2) gain.
          if (u != 0) {
            term *= kSqrt2;
          }
          if (v != 0) {
            term *= kSqrt2;
          }
          sum += term;
        }
      }
      output[row * 32 + col] = sum / 4;
    }
  }
}
60ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
61ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangstatic void reference_32x32_dct_1d(double in[32], double out[32], int stride) {
62ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  const double kInvSqrt2 = 0.707106781186547524400844362104;
63ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  for (int k = 0; k < 32; k++) {
64ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    out[k] = 0.0;
65ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int n = 0; n < 32; n++)
66ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      out[k] += in[n] * cos(kPi * (2 * n + 1) * k / 64.0);
67ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    if (k == 0)
68ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      out[k] = out[k] * kInvSqrt2;
69ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  }
70ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang}
71ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
72ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangstatic void reference_32x32_dct_2d(int16_t input[32*32], double output[32*32]) {
73ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  // First transform columns
74ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  for (int i = 0; i < 32; ++i) {
75ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    double temp_in[32], temp_out[32];
76ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 32; ++j)
77ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      temp_in[j] = input[j*32 + i];
78ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    reference_32x32_dct_1d(temp_in, temp_out, 1);
79ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 32; ++j)
80ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      output[j * 32 + i] = temp_out[j];
81ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  }
82ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  // Then transform rows
83ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  for (int i = 0; i < 32; ++i) {
84ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    double temp_in[32], temp_out[32];
85ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 32; ++j)
86ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      temp_in[j] = output[j + i*32];
87ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    reference_32x32_dct_1d(temp_in, temp_out, 1);
88ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    // Scale by some magic number
89ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 32; ++j)
90ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      output[j + i * 32] = temp_out[j] / 4;
91ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  }
92ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang}
93ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
94ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangTEST(VP9Idct32x32Test, AccuracyCheck) {
95ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  ACMRandom rnd(ACMRandom::DeterministicSeed());
96ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  const int count_test_block = 1000;
97ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  for (int i = 0; i < count_test_block; ++i) {
98ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    int16_t in[1024], coeff[1024];
99ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    uint8_t dst[1024], src[1024];
100ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    double out_r[1024];
101ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
102ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j) {
103ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      src[j] = rnd.Rand8();
104ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      dst[j] = rnd.Rand8();
105ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    }
106ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    // Initialize a test block with input range [-255, 255].
107ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j)
108ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      in[j] = src[j] - dst[j];
109ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
110ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    reference_32x32_dct_2d(in, out_r);
111ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; j++)
112ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      coeff[j] = round(out_r[j]);
113ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    vp9_short_idct32x32_add_c(coeff, dst, 32);
114ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j) {
115ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      const int diff = dst[j] - src[j];
116ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      const int error = diff * diff;
117ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      EXPECT_GE(1, error)
118ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang          << "Error: 32x32 IDCT has error " << error
119ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang          << " at index " << j;
120ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    }
121ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  }
122ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang}
123ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
124ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangTEST(VP9Fdct32x32Test, AccuracyCheck) {
125ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  ACMRandom rnd(ACMRandom::DeterministicSeed());
126ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  unsigned int max_error = 0;
127ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  int64_t total_error = 0;
128ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  const int count_test_block = 1000;
129ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  for (int i = 0; i < count_test_block; ++i) {
130ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    int16_t test_input_block[1024];
131ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    int16_t test_temp_block[1024];
132ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    uint8_t dst[1024], src[1024];
133ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
134ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j) {
135ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      src[j] = rnd.Rand8();
136ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      dst[j] = rnd.Rand8();
137ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    }
138ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    // Initialize a test block with input range [-255, 255].
139ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j)
140ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      test_input_block[j] = src[j] - dst[j];
141ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
142ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    const int pitch = 64;
143ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    vp9_short_fdct32x32_c(test_input_block, test_temp_block, pitch);
144ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    vp9_short_idct32x32_add_c(test_temp_block, dst, 32);
145ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
146ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j) {
147ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      const unsigned diff = dst[j] - src[j];
148ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      const unsigned error = diff * diff;
149ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      if (max_error < error)
150ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang        max_error = error;
151ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      total_error += error;
152ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    }
153ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  }
154ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
155ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  EXPECT_GE(1u, max_error)
156ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      << "Error: 32x32 FDCT/IDCT has an individual roundtrip error > 1";
157ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
158ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  EXPECT_GE(count_test_block, total_error)
159ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      << "Error: 32x32 FDCT/IDCT has average roundtrip error > 1 per block";
160ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang}
161ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
162ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangTEST(VP9Fdct32x32Test, CoeffSizeCheck) {
163ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  ACMRandom rnd(ACMRandom::DeterministicSeed());
164ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  const int count_test_block = 1000;
165ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  for (int i = 0; i < count_test_block; ++i) {
166ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    int16_t input_block[1024], input_extreme_block[1024];
167ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    int16_t output_block[1024], output_extreme_block[1024];
168ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
169ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    // Initialize a test block with input range [-255, 255].
170ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j) {
171ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      input_block[j] = rnd.Rand8() - rnd.Rand8();
172ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      input_extreme_block[j] = rnd.Rand8() % 2 ? 255 : -255;
173ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    }
174ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    if (i == 0)
175ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      for (int j = 0; j < 1024; ++j)
176ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang        input_extreme_block[j] = 255;
177ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
178ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    const int pitch = 64;
179ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    vp9_short_fdct32x32_c(input_block, output_block, pitch);
180ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    vp9_short_fdct32x32_c(input_extreme_block, output_extreme_block, pitch);
181ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang
182ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    // The minimum quant value is 4.
183ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    for (int j = 0; j < 1024; ++j) {
184ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      EXPECT_GE(4*DCT_MAX_VALUE, abs(output_block[j]))
185ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang          << "Error: 32x32 FDCT has coefficient larger than 4*DCT_MAX_VALUE";
186ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang      EXPECT_GE(4*DCT_MAX_VALUE, abs(output_extreme_block[j]))
187ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang          << "Error: 32x32 FDCT extreme has coefficient larger than "
188ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang             "4*DCT_MAX_VALUE";
189ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang    }
190ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang  }
191ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang}
192ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang}  // namespace
193