// dct32x32_test.cc revision ba164dffc5a6795bce97fae02b51ccf3330e15e4
1ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang/* 2ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang * Copyright (c) 2012 The WebM project authors. All Rights Reserved. 3ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang * 4ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang * Use of this source code is governed by a BSD-style license 5ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang * that can be found in the LICENSE file in the root of the source 6ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang * tree. An additional intellectual property rights grant can be found 7ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang * in the file PATENTS. All contributing project authors may 8ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang * be found in the AUTHORS file in the root of the source tree. 9ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang */ 10ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 11ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include <math.h> 12ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include <stdlib.h> 13ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include <string.h> 14ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 15ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "third_party/googletest/src/include/gtest/gtest.h" 16ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 17ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangextern "C" { 18ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "vp9/common/vp9_entropy.h" 19ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "./vp9_rtcd.h" 20ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang void vp9_short_fdct32x32_c(int16_t *input, int16_t *out, int pitch); 21ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang void vp9_short_idct32x32_add_c(short *input, uint8_t *output, int pitch); 22ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 23ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 24ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "test/acm_random.h" 25ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#include "vpx/vpx_integer.h" 
26ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 27ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangusing libvpx_test::ACMRandom; 28ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 29ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangnamespace { 30ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#ifdef _MSC_VER 31ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangstatic int round(double x) { 32ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang if (x < 0) 33ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang return (int)ceil(x - 0.5); 34ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang else 35ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang return (int)floor(x + 0.5); 36ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 37ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang#endif 38ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 39ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangstatic const double kPi = 3.141592653589793238462643383279502884; 40ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangstatic void reference2_32x32_idct_2d(double *input, double *output) { 41ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang double x; 42ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int l = 0; l < 32; ++l) { 43ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int k = 0; k < 32; ++k) { 44ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang double s = 0; 45ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int i = 0; i < 32; ++i) { 46ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 32; ++j) { 47ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang x = cos(kPi * j * (l + 0.5) / 32.0) * 48ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang cos(kPi * i * (k + 0.5) / 32.0) * input[i * 32 + j] / 1024; 49ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang if (i != 0) 50ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang x *= sqrt(2.0); 51ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang if (j != 0) 52ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang x *= sqrt(2.0); 53ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang s += x; 
54ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 55ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 56ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang output[k * 32 + l] = s / 4; 57ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 58ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 59ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 60ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 61ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangstatic void reference_32x32_dct_1d(double in[32], double out[32], int stride) { 62ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const double kInvSqrt2 = 0.707106781186547524400844362104; 63ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int k = 0; k < 32; k++) { 64ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang out[k] = 0.0; 65ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int n = 0; n < 32; n++) 66ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang out[k] += in[n] * cos(kPi * (2 * n + 1) * k / 64.0); 67ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang if (k == 0) 68ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang out[k] = out[k] * kInvSqrt2; 69ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 70ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 71ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 72ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangstatic void reference_32x32_dct_2d(int16_t input[32*32], double output[32*32]) { 73ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang // First transform columns 74ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int i = 0; i < 32; ++i) { 75ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang double temp_in[32], temp_out[32]; 76ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 32; ++j) 77ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang temp_in[j] = input[j*32 + i]; 78ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang reference_32x32_dct_1d(temp_in, temp_out, 1); 79ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 32; ++j) 80ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang output[j * 32 + i] = 
temp_out[j]; 81ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 82ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang // Then transform rows 83ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int i = 0; i < 32; ++i) { 84ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang double temp_in[32], temp_out[32]; 85ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 32; ++j) 86ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang temp_in[j] = output[j + i*32]; 87ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang reference_32x32_dct_1d(temp_in, temp_out, 1); 88ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang // Scale by some magic number 89ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 32; ++j) 90ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang output[j + i * 32] = temp_out[j] / 4; 91ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 92ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 93ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 94ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangTEST(VP9Idct32x32Test, AccuracyCheck) { 95ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang ACMRandom rnd(ACMRandom::DeterministicSeed()); 96ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const int count_test_block = 1000; 97ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int i = 0; i < count_test_block; ++i) { 98ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang int16_t in[1024], coeff[1024]; 99ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang uint8_t dst[1024], src[1024]; 100ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang double out_r[1024]; 101ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 102ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) { 103ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang src[j] = rnd.Rand8(); 104ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang dst[j] = rnd.Rand8(); 105ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 106ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang // Initialize a test block with input range [-255, 255]. 
107ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) 108ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang in[j] = src[j] - dst[j]; 109ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 110ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang reference_32x32_dct_2d(in, out_r); 111ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; j++) 112ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang coeff[j] = round(out_r[j]); 113ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang vp9_short_idct32x32_add_c(coeff, dst, 32); 114ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) { 115ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const int diff = dst[j] - src[j]; 116ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const int error = diff * diff; 117ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang EXPECT_GE(1, error) 118ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang << "Error: 32x32 IDCT has error " << error 119ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang << " at index " << j; 120ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 121ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 122ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 123ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 124ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangTEST(VP9Fdct32x32Test, AccuracyCheck) { 125ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang ACMRandom rnd(ACMRandom::DeterministicSeed()); 126ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang unsigned int max_error = 0; 127ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang int64_t total_error = 0; 128ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const int count_test_block = 1000; 129ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int i = 0; i < count_test_block; ++i) { 130ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang int16_t test_input_block[1024]; 131ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang int16_t test_temp_block[1024]; 132ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang uint8_t dst[1024], src[1024]; 
133ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 134ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) { 135ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang src[j] = rnd.Rand8(); 136ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang dst[j] = rnd.Rand8(); 137ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 138ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang // Initialize a test block with input range [-255, 255]. 139ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) 140ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang test_input_block[j] = src[j] - dst[j]; 141ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 142ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const int pitch = 64; 143ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang vp9_short_fdct32x32_c(test_input_block, test_temp_block, pitch); 144ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang vp9_short_idct32x32_add_c(test_temp_block, dst, 32); 145ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 146ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) { 147ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const unsigned diff = dst[j] - src[j]; 148ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const unsigned error = diff * diff; 149ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang if (max_error < error) 150ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang max_error = error; 151ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang total_error += error; 152ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 153ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 154ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 155ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang EXPECT_GE(1u, max_error) 156ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang << "Error: 32x32 FDCT/IDCT has an individual roundtrip error > 1"; 157ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 158ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang EXPECT_GE(count_test_block, total_error) 
159ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang << "Error: 32x32 FDCT/IDCT has average roundtrip error > 1 per block"; 160ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 161ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 162ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuangTEST(VP9Fdct32x32Test, CoeffSizeCheck) { 163ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang ACMRandom rnd(ACMRandom::DeterministicSeed()); 164ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const int count_test_block = 1000; 165ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int i = 0; i < count_test_block; ++i) { 166ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang int16_t input_block[1024], input_extreme_block[1024]; 167ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang int16_t output_block[1024], output_extreme_block[1024]; 168ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 169ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang // Initialize a test block with input range [-255, 255]. 170ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) { 171ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang input_block[j] = rnd.Rand8() - rnd.Rand8(); 172ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang input_extreme_block[j] = rnd.Rand8() % 2 ? 255 : -255; 173ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 174ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang if (i == 0) 175ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) 176ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang input_extreme_block[j] = 255; 177ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 178ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang const int pitch = 64; 179ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang vp9_short_fdct32x32_c(input_block, output_block, pitch); 180ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang vp9_short_fdct32x32_c(input_extreme_block, output_extreme_block, pitch); 181ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang 182ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang // The minimum quant value is 4. 
183ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang for (int j = 0; j < 1024; ++j) { 184ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang EXPECT_GE(4*DCT_MAX_VALUE, abs(output_block[j])) 185ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang << "Error: 32x32 FDCT has coefficient larger than 4*DCT_MAX_VALUE"; 186ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang EXPECT_GE(4*DCT_MAX_VALUE, abs(output_extreme_block[j])) 187ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang << "Error: 32x32 FDCT extreme has coefficient larger than " 188ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang "4*DCT_MAX_VALUE"; 189ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 190ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang } 191ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} 192ba164dffc5a6795bce97fae02b51ccf3330e15e4hkuang} // namespace 193