1// Copyright 2010 Google Inc. All Rights Reserved.
2//
3// Use of this source code is governed by a BSD-style license
4// that can be found in the COPYING file in the root of the source
5// tree. An additional intellectual property rights grant can be found
6// in the file PATENTS. All contributing project authors may
7// be found in the AUTHORS file in the root of the source tree.
8// -----------------------------------------------------------------------------
9//
10// VP8 decoder: internal header.
11//
12// Author: Skal (pascal.massimino@gmail.com)
13
14#ifndef WEBP_DEC_VP8I_H_
15#define WEBP_DEC_VP8I_H_
16
17#include <string.h>     // for memcpy()
18#include "./vp8li.h"
19#include "../utils/bit_reader.h"
20#include "../utils/random.h"
21#include "../utils/thread.h"
22#include "../dsp/dsp.h"
23
24#ifdef __cplusplus
25extern "C" {
26#endif
27
28//------------------------------------------------------------------------------
29// Various defines and enums
30
// Decoder version numbers, split into major / minor / revision components
// (0.4.1 with the values below).
#define DEC_MAJ_VERSION 0
#define DEC_MIN_VERSION 4
#define DEC_REV_VERSION 1
35
// Intra prediction modes.
// The ten 4x4 modes come first; the 16x16-luma / chroma mode names are
// aliases that reuse four of those numeric values.
enum {
  // 4x4 modes
  B_DC_PRED = 0,
  B_TM_PRED,
  B_VE_PRED,
  B_HE_PRED,
  B_RD_PRED,
  B_VR_PRED,
  B_LD_PRED,
  B_VL_PRED,
  B_HD_PRED,
  B_HU_PRED,
  NUM_BMODES = B_HU_PRED + 1 - B_DC_PRED,  // = 10

  // Luma16 or UV modes
  DC_PRED = B_DC_PRED,
  TM_PRED = B_TM_PRED,
  V_PRED = B_VE_PRED,
  H_PRED = B_HE_PRED,
  B_PRED = NUM_BMODES,   // refined I4x4 mode

  // special modes (their values 4..6 coincide numerically with
  // B_RD_PRED..B_LD_PRED above)
  B_DC_PRED_NOTOP = 4,
  B_DC_PRED_NOLEFT = 5,
  B_DC_PRED_NOTOPLEFT = 6,
  NUM_B_DC_MODES = 7
};
59
// Fixed counts: segments, loop-filter deltas, partitions and the dimensions
// of the probability tables.
enum {
  MB_FEATURE_TREE_PROBS = 3,
  NUM_MB_SEGMENTS = 4,
  NUM_REF_LF_DELTAS = 4,
  NUM_MODE_LF_DELTAS = 4,    // I4x4, ZERO, *, SPLIT
  MAX_NUM_PARTITIONS = 8,

  // Probabilities
  NUM_TYPES = 4,
  NUM_BANDS = 8,
  NUM_CTX = 3,
  NUM_PROBAS = 11,
  NUM_MV_PROBAS = 19
};
71
72// YUV-cache parameters.
73// Constraints are: We need to store one 16x16 block of luma samples (y),
// and two 8x8 chroma blocks (u/v). These had better be 16-byte aligned,
75// in order to be SIMD-friendly. We also need to store the top, left and
76// top-left samples (from previously decoded blocks), along with four
77// extra top-right samples for luma (intra4x4 prediction only).
78// One possible layout is, using 32 * (17 + 9) bytes:
79//
80//   .+------   <- only 1 pixel high
81//   .|yyyyt.
82//   .|yyyyt.
83//   .|yyyyt.
84//   .|yyyy..
85//   .+--.+--   <- only 1 pixel high
86//   .|uu.|vv
87//   .|uu.|vv
88//
89// Every character is a 4x4 block, with legend:
90//  '.' = unused
//  'y' = y-samples   'u' = u-samples     'v' = v-samples
92//  '|' = left sample,   '-' = top sample,    '+' = top-left sample
93//  't' = extra top-right sample for 4x4 modes
94// With this layout, BPS (=Bytes Per Scan-line) is one cacheline size.
// Geometry of the yuv[] work buffer: 17 rows for luma (1 top row + 16 rows)
// followed by 9 rows shared by the two chroma blocks (1 top row + 8 rows).
#define BPS       32    // this is the common stride used by yuv[]
#define Y_SIZE   (BPS * 17)
#define YUV_SIZE (Y_SIZE + BPS * 9)
#define Y_OFF    (BPS * 1 + 8)       // one row down, 8 bytes in
#define U_OFF    (Y_OFF + BPS * 17)  // 16 luma rows + 1 chroma top row further
#define V_OFF    (U_OFF + 16)        // 16 bytes to the right of the u block
101
// Minimal width under which lossy multi-threading is always disabled.
// NOTE(review): the unit is presumably pixels -- confirm where this is used.
#define MIN_WIDTH_FOR_THREADS 512
104
105//------------------------------------------------------------------------------
106// Headers
107
// Frame-level header values.
// NOTE(review): field meanings are inferred from their names only (key-frame
// flag, profile number, show flag, byte length of a partition) -- confirm
// against the header parser before relying on them.
typedef struct {
  uint8_t key_frame_;
  uint8_t profile_;
  uint8_t show_;
  uint32_t partition_length_;
} VP8FrameHeader;
114
// Picture-level header values: dimensions, horizontal/vertical scale codes,
// colorspace and clamping type.
// NOTE(review): the units and valid ranges of width_/height_ and the encoding
// of xscale_/yscale_/clamp_type_ are not visible in this header -- confirm
// against the parser.
typedef struct {
  uint16_t width_;
  uint16_t height_;
  uint8_t xscale_;
  uint8_t yscale_;
  uint8_t colorspace_;   // 0 = YCbCr
  uint8_t clamp_type_;
} VP8PictureHeader;
123
// Segment features: per-segment quantizer and filter-strength values, one
// entry per segment (NUM_MB_SEGMENTS entries each).
typedef struct {
  // NOTE(review): presumably non-zero when segmentation is in use -- confirm.
  int use_segment_;
  int update_map_;        // whether to update the segment map or not
  int absolute_delta_;    // absolute or delta values for quantizer and filter
  int8_t quantizer_[NUM_MB_SEGMENTS];        // quantization changes
  int8_t filter_strength_[NUM_MB_SEGMENTS];  // filter strength for segments
} VP8SegmentHeader;
132
133
// Probabilities associated with one of the contexts: an array of NUM_PROBAS
// byte-sized entries.
typedef uint8_t VP8ProbaArray[NUM_PROBAS];
136
// Holds one VP8ProbaArray per context (NUM_CTX of them).
typedef struct {   // all the probabilities associated with one band
  VP8ProbaArray probas_[NUM_CTX];
} VP8BandProbas;
140
// Struct collecting all frame-persistent probabilities.
typedef struct {
  // NOTE(review): presumably the tree probabilities used when decoding
  // segment ids (MB_FEATURE_TREE_PROBS entries) -- confirm in the parser.
  uint8_t segments_[MB_FEATURE_TREE_PROBS];
  // Per-band probabilities, indexed as bands_[type][band].
  // Type: 0:Intra16-AC  1:Intra16-DC   2:Chroma   3:Intra4
  VP8BandProbas bands_[NUM_TYPES][NUM_BANDS];
} VP8Proba;
147
// Filter parameters: filter kind, level and sharpness, plus two tables of
// loop-filter deltas (NUM_REF_LF_DELTAS and NUM_MODE_LF_DELTAS entries).
typedef struct {
  int simple_;                  // 0=complex, 1=simple
  int level_;                   // [0..63]
  int sharpness_;               // [0..7]
  // NOTE(review): presumably tells whether the two delta tables below are
  // applied -- confirm against the filter setup code.
  int use_lf_delta_;
  int ref_lf_delta_[NUM_REF_LF_DELTAS];
  int mode_lf_delta_[NUM_MODE_LF_DELTAS];
} VP8FilterHeader;
157
158//------------------------------------------------------------------------------
// Information about the macroblocks.
160
// Filtering parameters stored as four bytes: two limits, an inner-filtering
// flag and a high-edge-variance threshold.
typedef struct {  // filter specs
  uint8_t f_limit_;      // filter limit in [3..189], or 0 if no filtering
  uint8_t f_ilevel_;     // inner limit in [1..63]
  uint8_t f_inner_;      // do inner filtering?
  uint8_t hev_thresh_;   // high edge variance threshold in [0..2]
} VP8FInfo;
167
// Non-zero-coefficient flags kept for the top/left neighbours of a macroblock.
typedef struct {  // Top/Left Contexts used for syntax-parsing
  uint8_t nz_;        // non-zero AC/DC coeffs (4bit for luma + 4bit for chroma)
  uint8_t nz_dc_;     // non-zero DC coeff (1bit)
} VP8MB;
172
// Dequantization matrices.
// A quant_t is a pair of factors stored in [DC, AC] order.
typedef int quant_t[2];      // [DC / AC].  Can be 'uint16_t[2]' too (~slower).
typedef struct {
  // Three [DC, AC] factor pairs, kept in this order.
  quant_t y1_mat_;
  quant_t y2_mat_;
  quant_t uv_mat_;

  int uv_quant_;   // quantizer value for U/V
  int dither_;     // amplitude of the dithering (0 = off, max=255)
} VP8QuantMatrix;
181
// Data needed to reconstruct a macroblock: its coefficients, its prediction
// modes and summary flags describing which sub-blocks carry coefficients.
typedef struct {
  int16_t coeffs_[384];   // 384 coeffs = (16+4+4) * 4*4
  uint8_t is_i4x4_;       // true if intra4x4
  uint8_t imodes_[16];    // one 16x16 mode (#0) or sixteen 4x4 modes
  uint8_t uvmode_;        // chroma prediction mode
  // Bit-wise info about the content of each 4x4 sub-block (in decoding order).
  // Each of the 4x4 blocks for y/u/v is associated with a 2b code according to:
  //   code=0 -> no coefficient
  //   code=1 -> only DC
  //   code=2 -> first three coefficients are non-zero
  //   code=3 -> more than three coefficients are non-zero
  // This allows calling specialized transform functions.
  uint32_t non_zero_y_;
  uint32_t non_zero_uv_;
  uint8_t dither_;      // local dithering strength (deduced from non_zero_*)
  // NOTE(review): the two fields below are undocumented; by name they hold a
  // skip flag and a segment index -- confirm against the parser.
  uint8_t skip_;
  uint8_t segment_;
} VP8MBData;
201
// Persistent information needed by the parallel processing: which row to
// work on, whether it needs filtering, and the buffers/VP8Io to use for it.
typedef struct {
  int id_;              // cache row to process (in [0..2])
  int mb_y_;            // macroblock position of the row
  int filter_row_;      // true if row-filtering is needed
  VP8FInfo* f_info_;    // filter strengths (swapped with dec->f_info_)
  VP8MBData* mb_data_;  // reconstruction data (swapped with dec->mb_data_)
  VP8Io io_;            // copy of the VP8Io to pass to put()
} VP8ThreadContext;
211
// Top samples saved for one macroblock: 16 luma bytes followed by 8 bytes for
// each chroma plane (32 bytes in total, so it fits into a cache-line).
typedef struct {
  uint8_t y[16];
  uint8_t u[8];
  uint8_t v[8];
} VP8TopSamples;
216
217//------------------------------------------------------------------------------
218// VP8Decoder: the main opaque structure handed over to user
219
220struct VP8Decoder {
221  VP8StatusCode status_;
222  int ready_;     // true if ready to decode a picture with VP8Decode()
223  const char* error_msg_;  // set when status_ is not OK.
224
225  // Main data source
226  VP8BitReader br_;
227
228  // headers
229  VP8FrameHeader   frm_hdr_;
230  VP8PictureHeader pic_hdr_;
231  VP8FilterHeader  filter_hdr_;
232  VP8SegmentHeader segment_hdr_;
233
234  // Worker
235  WebPWorker worker_;
236  int mt_method_;      // multi-thread method: 0=off, 1=[parse+recon][filter]
237                       // 2=[parse][recon+filter]
238  int cache_id_;       // current cache row
239  int num_caches_;     // number of cached rows of 16 pixels (1, 2 or 3)
240  VP8ThreadContext thread_ctx_;  // Thread context
241
242  // dimension, in macroblock units.
243  int mb_w_, mb_h_;
244
245  // Macroblock to process/filter, depending on cropping and filter_type.
246  int tl_mb_x_, tl_mb_y_;  // top-left MB that must be in-loop filtered
247  int br_mb_x_, br_mb_y_;  // last bottom-right MB that must be decoded
248
249  // number of partitions.
250  int num_parts_;
251  // per-partition boolean decoders.
252  VP8BitReader parts_[MAX_NUM_PARTITIONS];
253
254  // Dithering strength, deduced from decoding options
255  int dither_;                // whether to use dithering or not
256  VP8Random dithering_rg_;    // random generator for dithering
257
258  // dequantization (one set of DC/AC dequant factor per segment)
259  VP8QuantMatrix dqm_[NUM_MB_SEGMENTS];
260
261  // probabilities
262  VP8Proba proba_;
263  int use_skip_proba_;
264  uint8_t skip_p_;
265
266  // Boundary data cache and persistent buffers.
267  uint8_t* intra_t_;      // top intra modes values: 4 * mb_w_
268  uint8_t  intra_l_[4];   // left intra modes values
269
270  VP8TopSamples* yuv_t_;  // top y/u/v samples
271
272  VP8MB* mb_info_;        // contextual macroblock info (mb_w_ + 1)
273  VP8FInfo* f_info_;      // filter strength info
274  uint8_t* yuv_b_;        // main block for Y/U/V (size = YUV_SIZE)
275
276  uint8_t* cache_y_;      // macroblock row for storing unfiltered samples
277  uint8_t* cache_u_;
278  uint8_t* cache_v_;
279  int cache_y_stride_;
280  int cache_uv_stride_;
281
282  // main memory chunk for the above data. Persistent.
283  void* mem_;
284  size_t mem_size_;
285
286  // Per macroblock non-persistent infos.
287  int mb_x_, mb_y_;       // current position, in macroblock units
288  VP8MBData* mb_data_;    // parsed reconstruction data
289
290  // Filtering side-info
291  int filter_type_;                          // 0=off, 1=simple, 2=complex
292  VP8FInfo fstrengths_[NUM_MB_SEGMENTS][2];  // precalculated per-segment/type
293
294  // Alpha
295  struct ALPHDecoder* alph_dec_;  // alpha-plane decoder object
296  const uint8_t* alpha_data_;     // compressed alpha data (if present)
297  size_t alpha_data_size_;
298  int is_alpha_decoded_;  // true if alpha_data_ is decoded in alpha_plane_
299  uint8_t* alpha_plane_;  // output. Persistent, contains the whole data.
300  int alpha_dithering_;   // derived from decoding options (0=off, 100=full).
301};
302
303//------------------------------------------------------------------------------
304// internal functions. Not public.
305
// in vp8.c
// Reports the status code 'error' and its message 'msg' for decoder 'dec'.
// NOTE(review): presumably stores them in dec->status_ / dec->error_msg_; the
// meaning of the returned int is not visible here -- confirm in vp8.c.
int VP8SetError(VP8Decoder* const dec,
                VP8StatusCode error, const char* const msg);
309
// in tree.c
// NOTE(review): presumably resets '*proba' to default values -- confirm.
void VP8ResetProba(VP8Proba* const proba);
// NOTE(review): presumably reads probability data from 'br' into 'dec'
// -- confirm in tree.c.
void VP8ParseProba(VP8BitReader* const br, VP8Decoder* const dec);
// parses one row of intra mode data in partition 0, returns !eof
int VP8ParseIntraModeRow(VP8BitReader* const br, VP8Decoder* const dec);
315
// in quant.c
// NOTE(review): presumably parses the quantizer settings and fills in the
// decoder's dequantization matrices -- confirm in quant.c.
void VP8ParseQuant(VP8Decoder* const dec);
318
// in frame.c
// NOTE(review): purpose and return convention are not documented here;
// presumably prepares per-frame state and returns false on error like the
// other int-returning helpers below -- confirm in frame.c.
int VP8InitFrame(VP8Decoder* const dec, VP8Io* io);
// Call io->setup() and finish setting up scan parameters.
// After this call returns, one must always call VP8ExitCritical() with the
// same parameters. Both functions should be used in pair. Returns VP8_STATUS_OK
// if ok, otherwise sets and returns the error status on *dec.
VP8StatusCode VP8EnterCritical(VP8Decoder* const dec, VP8Io* const io);
// Must always be called in pair with VP8EnterCritical().
// Returns false in case of error.
int VP8ExitCritical(VP8Decoder* const dec, VP8Io* const io);
// Return the multi-threading method to use (0=off), depending
// on options and bitstream size. Only for lossy decoding.
int VP8GetThreadMethod(const WebPDecoderOptions* const options,
                       const WebPHeaderStructure* const headers,
                       int width, int height);
// Initialize dithering post-process if needed.
void VP8InitDithering(const WebPDecoderOptions* const options,
                      VP8Decoder* const dec);
// Process the last decoded row (filtering + output).
// NOTE(review): the return convention is not stated; presumably false on
// error -- confirm in frame.c.
int VP8ProcessRow(VP8Decoder* const dec, VP8Io* const io);
// To be called at the start of a new scanline, to initialize predictors.
void VP8InitScanline(VP8Decoder* const dec);
// Decode one macroblock. Returns false if there is not enough data.
int VP8DecodeMB(VP8Decoder* const dec, VP8BitReader* const token_br);
343
// in alpha.c
// NOTE(review): presumably decodes 'num_rows' rows of the alpha plane
// starting at 'row' and returns a pointer to the decoded samples; the error
// convention (NULL?) is not visible here -- confirm in alpha.c.
const uint8_t* VP8DecompressAlphaRows(VP8Decoder* const dec,
                                      int row, int num_rows);
347
348//------------------------------------------------------------------------------
349
350#ifdef __cplusplus
351}    // extern "C"
352#endif
353
354#endif  /* WEBP_DEC_VP8I_H_ */
355