1// Copyright 2011 Google Inc. All Rights Reserved.
2//
3// Use of this source code is governed by a BSD-style license
4// that can be found in the COPYING file in the root of the source
5// tree. An additional intellectual property rights grant can be found
6// in the file PATENTS. All contributing project authors may
7// be found in the AUTHORS file in the root of the source tree.
8// -----------------------------------------------------------------------------
9//
10// WebPPicture utils: colorspace conversion, crop, ...
11//
12// Author: Skal (pascal.massimino@gmail.com)
13
14#include <assert.h>
15#include <stdlib.h>
16#include <math.h>
17
18#include "./vp8enci.h"
19#include "../utils/rescaler.h"
20#include "../utils/utils.h"
21#include "../dsp/dsp.h"
22#include "../dsp/yuv.h"
23
24#if defined(__cplusplus) || defined(c_plusplus)
25extern "C" {
26#endif
27
28#define HALVE(x) (((x) + 1) >> 1)
29#define IS_YUV_CSP(csp, YUV_CSP) (((csp) & WEBP_CSP_UV_MASK) == (YUV_CSP))
30
31static const union {
32  uint32_t argb;
33  uint8_t  bytes[4];
34} test_endian = { 0xff000000u };
35#define ALPHA_IS_LAST (test_endian.bytes[3] == 0xff)
36
37//------------------------------------------------------------------------------
38// WebPPicture
39//------------------------------------------------------------------------------
40
41int WebPPictureAlloc(WebPPicture* picture) {
42  if (picture != NULL) {
43    const WebPEncCSP uv_csp = picture->colorspace & WEBP_CSP_UV_MASK;
44    const int has_alpha = picture->colorspace & WEBP_CSP_ALPHA_BIT;
45    const int width = picture->width;
46    const int height = picture->height;
47
48    if (!picture->use_argb) {
49      const int y_stride = width;
50      const int uv_width = HALVE(width);
51      const int uv_height = HALVE(height);
52      const int uv_stride = uv_width;
53      int uv0_stride = 0;
54      int a_width, a_stride;
55      uint64_t y_size, uv_size, uv0_size, a_size, total_size;
56      uint8_t* mem;
57
58      // U/V
59      switch (uv_csp) {
60        case WEBP_YUV420:
61          break;
62#ifdef WEBP_EXPERIMENTAL_FEATURES
63        case WEBP_YUV400:    // for now, we'll just reset the U/V samples
64          break;
65        case WEBP_YUV422:
66          uv0_stride = uv_width;
67          break;
68        case WEBP_YUV444:
69          uv0_stride = width;
70          break;
71#endif
72        default:
73          return 0;
74      }
75      uv0_size = height * uv0_stride;
76
77      // alpha
78      a_width = has_alpha ? width : 0;
79      a_stride = a_width;
80      y_size = (uint64_t)y_stride * height;
81      uv_size = (uint64_t)uv_stride * uv_height;
82      a_size =  (uint64_t)a_stride * height;
83
84      total_size = y_size + a_size + 2 * uv_size + 2 * uv0_size;
85
86      // Security and validation checks
87      if (width <= 0 || height <= 0 ||         // luma/alpha param error
88          uv_width < 0 || uv_height < 0) {     // u/v param error
89        return 0;
90      }
91      // Clear previous buffer and allocate a new one.
92      WebPPictureFree(picture);   // erase previous buffer
93      mem = (uint8_t*)WebPSafeMalloc(total_size, sizeof(*mem));
94      if (mem == NULL) return 0;
95
96      // From now on, we're in the clear, we can no longer fail...
97      picture->memory_ = (void*)mem;
98      picture->y_stride  = y_stride;
99      picture->uv_stride = uv_stride;
100      picture->a_stride  = a_stride;
101      picture->uv0_stride = uv0_stride;
102      // TODO(skal): we could align the y/u/v planes and adjust stride.
103      picture->y = mem;
104      mem += y_size;
105
106      picture->u = mem;
107      mem += uv_size;
108      picture->v = mem;
109      mem += uv_size;
110
111      if (a_size) {
112        picture->a = mem;
113        mem += a_size;
114      }
115      if (uv0_size) {
116        picture->u0 = mem;
117        mem += uv0_size;
118        picture->v0 = mem;
119        mem += uv0_size;
120      }
121    } else {
122      void* memory;
123      const uint64_t argb_size = (uint64_t)width * height;
124      if (width <= 0 || height <= 0) {
125        return 0;
126      }
127      // Clear previous buffer and allocate a new one.
128      WebPPictureFree(picture);   // erase previous buffer
129      memory = WebPSafeMalloc(argb_size, sizeof(*picture->argb));
130      if (memory == NULL) return 0;
131
132      // TODO(skal): align plane to cache line?
133      picture->memory_argb_ = memory;
134      picture->argb = (uint32_t*)memory;
135      picture->argb_stride = width;
136    }
137  }
138  return 1;
139}
140
141// Remove reference to the ARGB buffer (doesn't free anything).
142static void PictureResetARGB(WebPPicture* const picture) {
143  picture->memory_argb_ = NULL;
144  picture->argb = NULL;
145  picture->argb_stride = 0;
146}
147
148// Remove reference to the YUVA buffer (doesn't free anything).
149static void PictureResetYUVA(WebPPicture* const picture) {
150  picture->memory_ = NULL;
151  picture->y = picture->u = picture->v = picture->a = NULL;
152  picture->u0 = picture->v0 = NULL;
153  picture->y_stride = picture->uv_stride = 0;
154  picture->a_stride = 0;
155  picture->uv0_stride = 0;
156}
157
158// Grab the 'specs' (writer, *opaque, width, height...) from 'src' and copy them
159// into 'dst'. Mark 'dst' as not owning any memory.
160static void WebPPictureGrabSpecs(const WebPPicture* const src,
161                                 WebPPicture* const dst) {
162  assert(src != NULL && dst != NULL);
163  *dst = *src;
164  PictureResetYUVA(dst);
165  PictureResetARGB(dst);
166}
167
168// Allocate a new argb buffer, discarding any existing one and preserving
169// the other YUV(A) buffer.
170static int PictureAllocARGB(WebPPicture* const picture) {
171  WebPPicture tmp;
172  free(picture->memory_argb_);
173  PictureResetARGB(picture);
174  picture->use_argb = 1;
175  WebPPictureGrabSpecs(picture, &tmp);
176  if (!WebPPictureAlloc(&tmp)) {
177    return WebPEncodingSetError(picture, VP8_ENC_ERROR_OUT_OF_MEMORY);
178  }
179  picture->memory_argb_ = tmp.memory_argb_;
180  picture->argb = tmp.argb;
181  picture->argb_stride = tmp.argb_stride;
182  return 1;
183}
184
185// Release memory owned by 'picture' (both YUV and ARGB buffers).
186void WebPPictureFree(WebPPicture* picture) {
187  if (picture != NULL) {
188    free(picture->memory_);
189    free(picture->memory_argb_);
190    PictureResetYUVA(picture);
191    PictureResetARGB(picture);
192  }
193}
194
195//------------------------------------------------------------------------------
196// Picture copying
197
198// Not worth moving to dsp/enc.c (only used here).
199static void CopyPlane(const uint8_t* src, int src_stride,
200                      uint8_t* dst, int dst_stride, int width, int height) {
201  while (height-- > 0) {
202    memcpy(dst, src, width);
203    src += src_stride;
204    dst += dst_stride;
205  }
206}
207
208// Adjust top-left corner to chroma sample position.
209static void SnapTopLeftPosition(const WebPPicture* const pic,
210                                int* const left, int* const top) {
211  if (!pic->use_argb) {
212    const int is_yuv422 = IS_YUV_CSP(pic->colorspace, WEBP_YUV422);
213    if (IS_YUV_CSP(pic->colorspace, WEBP_YUV420) || is_yuv422) {
214      *left &= ~1;
215      if (!is_yuv422) *top &= ~1;
216    }
217  }
218}
219
220// Adjust top-left corner and verify that the sub-rectangle is valid.
221static int AdjustAndCheckRectangle(const WebPPicture* const pic,
222                                   int* const left, int* const top,
223                                   int width, int height) {
224  SnapTopLeftPosition(pic, left, top);
225  if ((*left) < 0 || (*top) < 0) return 0;
226  if (width <= 0 || height <= 0) return 0;
227  if ((*left) + width > pic->width) return 0;
228  if ((*top) + height > pic->height) return 0;
229  return 1;
230}
231
232int WebPPictureCopy(const WebPPicture* src, WebPPicture* dst) {
233  if (src == NULL || dst == NULL) return 0;
234  if (src == dst) return 1;
235
236  WebPPictureGrabSpecs(src, dst);
237  if (!WebPPictureAlloc(dst)) return 0;
238
239  if (!src->use_argb) {
240    CopyPlane(src->y, src->y_stride,
241              dst->y, dst->y_stride, dst->width, dst->height);
242    CopyPlane(src->u, src->uv_stride,
243              dst->u, dst->uv_stride, HALVE(dst->width), HALVE(dst->height));
244    CopyPlane(src->v, src->uv_stride,
245              dst->v, dst->uv_stride, HALVE(dst->width), HALVE(dst->height));
246    if (dst->a != NULL)  {
247      CopyPlane(src->a, src->a_stride,
248                dst->a, dst->a_stride, dst->width, dst->height);
249    }
250#ifdef WEBP_EXPERIMENTAL_FEATURES
251    if (dst->u0 != NULL)  {
252      int uv0_width = src->width;
253      if (IS_YUV_CSP(dst->colorspace, WEBP_YUV422)) {
254        uv0_width = HALVE(uv0_width);
255      }
256      CopyPlane(src->u0, src->uv0_stride,
257                dst->u0, dst->uv0_stride, uv0_width, dst->height);
258      CopyPlane(src->v0, src->uv0_stride,
259                dst->v0, dst->uv0_stride, uv0_width, dst->height);
260    }
261#endif
262  } else {
263    CopyPlane((const uint8_t*)src->argb, 4 * src->argb_stride,
264              (uint8_t*)dst->argb, 4 * dst->argb_stride,
265              4 * dst->width, dst->height);
266  }
267  return 1;
268}
269
270int WebPPictureIsView(const WebPPicture* picture) {
271  if (picture == NULL) return 0;
272  if (picture->use_argb) {
273    return (picture->memory_argb_ == NULL);
274  }
275  return (picture->memory_ == NULL);
276}
277
278int WebPPictureView(const WebPPicture* src,
279                    int left, int top, int width, int height,
280                    WebPPicture* dst) {
281  if (src == NULL || dst == NULL) return 0;
282
283  // verify rectangle position.
284  if (!AdjustAndCheckRectangle(src, &left, &top, width, height)) return 0;
285
286  if (src != dst) {  // beware of aliasing! We don't want to leak 'memory_'.
287    WebPPictureGrabSpecs(src, dst);
288  }
289  dst->width = width;
290  dst->height = height;
291  if (!src->use_argb) {
292    dst->y = src->y + top * src->y_stride + left;
293    dst->u = src->u + (top >> 1) * src->uv_stride + (left >> 1);
294    dst->v = src->v + (top >> 1) * src->uv_stride + (left >> 1);
295    dst->y_stride = src->y_stride;
296    dst->uv_stride = src->uv_stride;
297    if (src->a != NULL) {
298      dst->a = src->a + top * src->a_stride + left;
299      dst->a_stride = src->a_stride;
300    }
301#ifdef WEBP_EXPERIMENTAL_FEATURES
302    if (src->u0 != NULL) {
303      const int left_pos =
304          IS_YUV_CSP(dst->colorspace, WEBP_YUV422) ? (left >> 1) : left;
305      dst->u0 = src->u0 + top * src->uv0_stride + left_pos;
306      dst->v0 = src->v0 + top * src->uv0_stride + left_pos;
307      dst->uv0_stride = src->uv0_stride;
308    }
309#endif
310  } else {
311    dst->argb = src->argb + top * src->argb_stride + left;
312    dst->argb_stride = src->argb_stride;
313  }
314  return 1;
315}
316
317//------------------------------------------------------------------------------
318// Picture cropping
319
320int WebPPictureCrop(WebPPicture* pic,
321                    int left, int top, int width, int height) {
322  WebPPicture tmp;
323
324  if (pic == NULL) return 0;
325  if (!AdjustAndCheckRectangle(pic, &left, &top, width, height)) return 0;
326
327  WebPPictureGrabSpecs(pic, &tmp);
328  tmp.width = width;
329  tmp.height = height;
330  if (!WebPPictureAlloc(&tmp)) return 0;
331
332  if (!pic->use_argb) {
333    const int y_offset = top * pic->y_stride + left;
334    const int uv_offset = (top / 2) * pic->uv_stride + left / 2;
335    CopyPlane(pic->y + y_offset, pic->y_stride,
336              tmp.y, tmp.y_stride, width, height);
337    CopyPlane(pic->u + uv_offset, pic->uv_stride,
338              tmp.u, tmp.uv_stride, HALVE(width), HALVE(height));
339    CopyPlane(pic->v + uv_offset, pic->uv_stride,
340              tmp.v, tmp.uv_stride, HALVE(width), HALVE(height));
341
342    if (tmp.a != NULL) {
343      const int a_offset = top * pic->a_stride + left;
344      CopyPlane(pic->a + a_offset, pic->a_stride,
345                tmp.a, tmp.a_stride, width, height);
346    }
347#ifdef WEBP_EXPERIMENTAL_FEATURES
348    if (tmp.u0 != NULL) {
349      int w = width;
350      int left_pos = left;
351      if (IS_YUV_CSP(tmp.colorspace, WEBP_YUV422)) {
352        w = HALVE(w);
353        left_pos = HALVE(left_pos);
354      }
355      CopyPlane(pic->u0 + top * pic->uv0_stride + left_pos, pic->uv0_stride,
356                tmp.u0, tmp.uv0_stride, w, height);
357      CopyPlane(pic->v0 + top * pic->uv0_stride + left_pos, pic->uv0_stride,
358                tmp.v0, tmp.uv0_stride, w, height);
359    }
360#endif
361  } else {
362    const uint8_t* const src =
363        (const uint8_t*)(pic->argb + top * pic->argb_stride + left);
364    CopyPlane(src, pic->argb_stride * 4,
365              (uint8_t*)tmp.argb, tmp.argb_stride * 4,
366              width * 4, height);
367  }
368  WebPPictureFree(pic);
369  *pic = tmp;
370  return 1;
371}
372
373//------------------------------------------------------------------------------
374// Simple picture rescaler
375
376static void RescalePlane(const uint8_t* src,
377                         int src_width, int src_height, int src_stride,
378                         uint8_t* dst,
379                         int dst_width, int dst_height, int dst_stride,
380                         int32_t* const work,
381                         int num_channels) {
382  WebPRescaler rescaler;
383  int y = 0;
384  WebPRescalerInit(&rescaler, src_width, src_height,
385                   dst, dst_width, dst_height, dst_stride,
386                   num_channels,
387                   src_width, dst_width,
388                   src_height, dst_height,
389                   work);
390  memset(work, 0, 2 * dst_width * num_channels * sizeof(*work));
391  while (y < src_height) {
392    y += WebPRescalerImport(&rescaler, src_height - y,
393                            src + y * src_stride, src_stride);
394    WebPRescalerExport(&rescaler);
395  }
396}
397
398int WebPPictureRescale(WebPPicture* pic, int width, int height) {
399  WebPPicture tmp;
400  int prev_width, prev_height;
401  int32_t* work;
402
403  if (pic == NULL) return 0;
404  prev_width = pic->width;
405  prev_height = pic->height;
406  // if width is unspecified, scale original proportionally to height ratio.
407  if (width == 0) {
408    width = (prev_width * height + prev_height / 2) / prev_height;
409  }
410  // if height is unspecified, scale original proportionally to width ratio.
411  if (height == 0) {
412    height = (prev_height * width + prev_width / 2) / prev_width;
413  }
414  // Check if the overall dimensions still make sense.
415  if (width <= 0 || height <= 0) return 0;
416
417  WebPPictureGrabSpecs(pic, &tmp);
418  tmp.width = width;
419  tmp.height = height;
420  if (!WebPPictureAlloc(&tmp)) return 0;
421
422  if (!pic->use_argb) {
423    work = (int32_t*)WebPSafeMalloc(2ULL * width, sizeof(*work));
424    if (work == NULL) {
425      WebPPictureFree(&tmp);
426      return 0;
427    }
428
429    RescalePlane(pic->y, prev_width, prev_height, pic->y_stride,
430                 tmp.y, width, height, tmp.y_stride, work, 1);
431    RescalePlane(pic->u,
432                 HALVE(prev_width), HALVE(prev_height), pic->uv_stride,
433                 tmp.u,
434                 HALVE(width), HALVE(height), tmp.uv_stride, work, 1);
435    RescalePlane(pic->v,
436                 HALVE(prev_width), HALVE(prev_height), pic->uv_stride,
437                 tmp.v,
438                 HALVE(width), HALVE(height), tmp.uv_stride, work, 1);
439
440    if (tmp.a != NULL) {
441      RescalePlane(pic->a, prev_width, prev_height, pic->a_stride,
442                   tmp.a, width, height, tmp.a_stride, work, 1);
443    }
444#ifdef WEBP_EXPERIMENTAL_FEATURES
445    if (tmp.u0 != NULL) {
446      const int s = IS_YUV_CSP(tmp.colorspace, WEBP_YUV422) ? 2 : 1;
447      RescalePlane(
448          pic->u0, (prev_width + s / 2) / s, prev_height, pic->uv0_stride,
449          tmp.u0, (width + s / 2) / s, height, tmp.uv0_stride, work, 1);
450      RescalePlane(
451          pic->v0, (prev_width + s / 2) / s, prev_height, pic->uv0_stride,
452          tmp.v0, (width + s / 2) / s, height, tmp.uv0_stride, work, 1);
453    }
454#endif
455  } else {
456    work = (int32_t*)WebPSafeMalloc(2ULL * width * 4, sizeof(*work));
457    if (work == NULL) {
458      WebPPictureFree(&tmp);
459      return 0;
460    }
461
462    RescalePlane((const uint8_t*)pic->argb, prev_width, prev_height,
463                 pic->argb_stride * 4,
464                 (uint8_t*)tmp.argb, width, height,
465                 tmp.argb_stride * 4,
466                 work, 4);
467  }
468  WebPPictureFree(pic);
469  free(work);
470  *pic = tmp;
471  return 1;
472}
473
474//------------------------------------------------------------------------------
475// WebPMemoryWriter: Write-to-memory
476
477void WebPMemoryWriterInit(WebPMemoryWriter* writer) {
478  writer->mem = NULL;
479  writer->size = 0;
480  writer->max_size = 0;
481}
482
483int WebPMemoryWrite(const uint8_t* data, size_t data_size,
484                    const WebPPicture* picture) {
485  WebPMemoryWriter* const w = (WebPMemoryWriter*)picture->custom_ptr;
486  uint64_t next_size;
487  if (w == NULL) {
488    return 1;
489  }
490  next_size = (uint64_t)w->size + data_size;
491  if (next_size > w->max_size) {
492    uint8_t* new_mem;
493    uint64_t next_max_size = 2ULL * w->max_size;
494    if (next_max_size < next_size) next_max_size = next_size;
495    if (next_max_size < 8192ULL) next_max_size = 8192ULL;
496    new_mem = (uint8_t*)WebPSafeMalloc(next_max_size, 1);
497    if (new_mem == NULL) {
498      return 0;
499    }
500    if (w->size > 0) {
501      memcpy(new_mem, w->mem, w->size);
502    }
503    free(w->mem);
504    w->mem = new_mem;
505    // down-cast is ok, thanks to WebPSafeMalloc
506    w->max_size = (size_t)next_max_size;
507  }
508  if (data_size > 0) {
509    memcpy(w->mem + w->size, data, data_size);
510    w->size += data_size;
511  }
512  return 1;
513}
514
515//------------------------------------------------------------------------------
516// Detection of non-trivial transparency
517
518// Returns true if alpha[] has non-0xff values.
519static int CheckNonOpaque(const uint8_t* alpha, int width, int height,
520                          int x_step, int y_step) {
521  if (alpha == NULL) return 0;
522  while (height-- > 0) {
523    int x;
524    for (x = 0; x < width * x_step; x += x_step) {
525      if (alpha[x] != 0xff) return 1;  // TODO(skal): check 4/8 bytes at a time.
526    }
527    alpha += y_step;
528  }
529  return 0;
530}
531
532// Checking for the presence of non-opaque alpha.
533int WebPPictureHasTransparency(const WebPPicture* picture) {
534  if (picture == NULL) return 0;
535  if (!picture->use_argb) {
536    return CheckNonOpaque(picture->a, picture->width, picture->height,
537                          1, picture->a_stride);
538  } else {
539    int x, y;
540    const uint32_t* argb = picture->argb;
541    if (argb == NULL) return 0;
542    for (y = 0; y < picture->height; ++y) {
543      for (x = 0; x < picture->width; ++x) {
544        if (argb[x] < 0xff000000u) return 1;   // test any alpha values != 0xff
545      }
546      argb += picture->argb_stride;
547    }
548  }
549  return 0;
550}
551
552//------------------------------------------------------------------------------
553// RGB -> YUV conversion
554
555// TODO: we can do better than simply 2x2 averaging on U/V samples.
556#define SUM4(ptr) ((ptr)[0] + (ptr)[step] + \
557                   (ptr)[rgb_stride] + (ptr)[rgb_stride + step])
558#define SUM2H(ptr) (2 * (ptr)[0] + 2 * (ptr)[step])
559#define SUM2V(ptr) (2 * (ptr)[0] + 2 * (ptr)[rgb_stride])
560#define SUM1(ptr)  (4 * (ptr)[0])
561#define RGB_TO_UV(x, y, SUM) {                           \
562  const int src = (2 * (step * (x) + (y) * rgb_stride)); \
563  const int dst = (x) + (y) * picture->uv_stride;        \
564  const int r = SUM(r_ptr + src);                        \
565  const int g = SUM(g_ptr + src);                        \
566  const int b = SUM(b_ptr + src);                        \
567  picture->u[dst] = VP8RGBToU(r, g, b);                  \
568  picture->v[dst] = VP8RGBToV(r, g, b);                  \
569}
570
571#define RGB_TO_UV0(x_in, x_out, y, SUM) {                \
572  const int src = (step * (x_in) + (y) * rgb_stride);    \
573  const int dst = (x_out) + (y) * picture->uv0_stride;   \
574  const int r = SUM(r_ptr + src);                        \
575  const int g = SUM(g_ptr + src);                        \
576  const int b = SUM(b_ptr + src);                        \
577  picture->u0[dst] = VP8RGBToU(r, g, b);                 \
578  picture->v0[dst] = VP8RGBToV(r, g, b);                 \
579}
580
581static void MakeGray(WebPPicture* const picture) {
582  int y;
583  const int uv_width = HALVE(picture->width);
584  const int uv_height = HALVE(picture->height);
585  for (y = 0; y < uv_height; ++y) {
586    memset(picture->u + y * picture->uv_stride, 128, uv_width);
587    memset(picture->v + y * picture->uv_stride, 128, uv_width);
588  }
589}
590
591static int ImportYUVAFromRGBA(const uint8_t* const r_ptr,
592                              const uint8_t* const g_ptr,
593                              const uint8_t* const b_ptr,
594                              const uint8_t* const a_ptr,
595                              int step,         // bytes per pixel
596                              int rgb_stride,   // bytes per scanline
597                              WebPPicture* const picture) {
598  const WebPEncCSP uv_csp = picture->colorspace & WEBP_CSP_UV_MASK;
599  int x, y;
600  const int width = picture->width;
601  const int height = picture->height;
602  const int has_alpha = CheckNonOpaque(a_ptr, width, height, step, rgb_stride);
603
604  picture->colorspace = uv_csp;
605  picture->use_argb = 0;
606  if (has_alpha) {
607    picture->colorspace |= WEBP_CSP_ALPHA_BIT;
608  }
609  if (!WebPPictureAlloc(picture)) return 0;
610
611  // Import luma plane
612  for (y = 0; y < height; ++y) {
613    for (x = 0; x < width; ++x) {
614      const int offset = step * x + y * rgb_stride;
615      picture->y[x + y * picture->y_stride] =
616          VP8RGBToY(r_ptr[offset], g_ptr[offset], b_ptr[offset]);
617    }
618  }
619
620  // Downsample U/V plane
621  if (uv_csp != WEBP_YUV400) {
622    for (y = 0; y < (height >> 1); ++y) {
623      for (x = 0; x < (width >> 1); ++x) {
624        RGB_TO_UV(x, y, SUM4);
625      }
626      if (width & 1) {
627        RGB_TO_UV(x, y, SUM2V);
628      }
629    }
630    if (height & 1) {
631      for (x = 0; x < (width >> 1); ++x) {
632        RGB_TO_UV(x, y, SUM2H);
633      }
634      if (width & 1) {
635        RGB_TO_UV(x, y, SUM1);
636      }
637    }
638
639#ifdef WEBP_EXPERIMENTAL_FEATURES
640    // Store original U/V samples too
641    if (uv_csp == WEBP_YUV422) {
642      for (y = 0; y < height; ++y) {
643        for (x = 0; x < (width >> 1); ++x) {
644          RGB_TO_UV0(2 * x, x, y, SUM2H);
645        }
646        if (width & 1) {
647          RGB_TO_UV0(2 * x, x, y, SUM1);
648        }
649      }
650    } else if (uv_csp == WEBP_YUV444) {
651      for (y = 0; y < height; ++y) {
652        for (x = 0; x < width; ++x) {
653          RGB_TO_UV0(x, x, y, SUM1);
654        }
655      }
656    }
657#endif
658  } else {
659    MakeGray(picture);
660  }
661
662  if (has_alpha) {
663    assert(step >= 4);
664    for (y = 0; y < height; ++y) {
665      for (x = 0; x < width; ++x) {
666        picture->a[x + y * picture->a_stride] =
667            a_ptr[step * x + y * rgb_stride];
668      }
669    }
670  }
671  return 1;
672}
673
674static int Import(WebPPicture* const picture,
675                  const uint8_t* const rgb, int rgb_stride,
676                  int step, int swap_rb, int import_alpha) {
677  const uint8_t* const r_ptr = rgb + (swap_rb ? 2 : 0);
678  const uint8_t* const g_ptr = rgb + 1;
679  const uint8_t* const b_ptr = rgb + (swap_rb ? 0 : 2);
680  const uint8_t* const a_ptr = import_alpha ? rgb + 3 : NULL;
681  const int width = picture->width;
682  const int height = picture->height;
683
684  if (!picture->use_argb) {
685    return ImportYUVAFromRGBA(r_ptr, g_ptr, b_ptr, a_ptr, step, rgb_stride,
686                              picture);
687  }
688  if (import_alpha) {
689    picture->colorspace |= WEBP_CSP_ALPHA_BIT;
690  } else {
691    picture->colorspace &= ~WEBP_CSP_ALPHA_BIT;
692  }
693  if (!WebPPictureAlloc(picture)) return 0;
694
695  if (!import_alpha) {
696    int x, y;
697    for (y = 0; y < height; ++y) {
698      for (x = 0; x < width; ++x) {
699        const int offset = step * x + y * rgb_stride;
700        const uint32_t argb =
701            0xff000000u |
702            (r_ptr[offset] << 16) |
703            (g_ptr[offset] <<  8) |
704            (b_ptr[offset]);
705        picture->argb[x + y * picture->argb_stride] = argb;
706      }
707    }
708  } else {
709    int x, y;
710    assert(step >= 4);
711    for (y = 0; y < height; ++y) {
712      for (x = 0; x < width; ++x) {
713        const int offset = step * x + y * rgb_stride;
714        const uint32_t argb = ((uint32_t)a_ptr[offset] << 24) |
715                              (r_ptr[offset] << 16) |
716                              (g_ptr[offset] <<  8) |
717                              (b_ptr[offset]);
718        picture->argb[x + y * picture->argb_stride] = argb;
719      }
720    }
721  }
722  return 1;
723}
724#undef SUM4
725#undef SUM2V
726#undef SUM2H
727#undef SUM1
728#undef RGB_TO_UV
729
730int WebPPictureImportRGB(WebPPicture* picture,
731                         const uint8_t* rgb, int rgb_stride) {
732  return Import(picture, rgb, rgb_stride, 3, 0, 0);
733}
734
735int WebPPictureImportBGR(WebPPicture* picture,
736                         const uint8_t* rgb, int rgb_stride) {
737  return Import(picture, rgb, rgb_stride, 3, 1, 0);
738}
739
740int WebPPictureImportRGBA(WebPPicture* picture,
741                          const uint8_t* rgba, int rgba_stride) {
742  return Import(picture, rgba, rgba_stride, 4, 0, 1);
743}
744
745int WebPPictureImportBGRA(WebPPicture* picture,
746                          const uint8_t* rgba, int rgba_stride) {
747  return Import(picture, rgba, rgba_stride, 4, 1, 1);
748}
749
750int WebPPictureImportRGBX(WebPPicture* picture,
751                          const uint8_t* rgba, int rgba_stride) {
752  return Import(picture, rgba, rgba_stride, 4, 0, 0);
753}
754
755int WebPPictureImportBGRX(WebPPicture* picture,
756                          const uint8_t* rgba, int rgba_stride) {
757  return Import(picture, rgba, rgba_stride, 4, 1, 0);
758}
759
760//------------------------------------------------------------------------------
761// Automatic YUV <-> ARGB conversions.
762
763int WebPPictureYUVAToARGB(WebPPicture* picture) {
764  if (picture == NULL) return 0;
765  if (picture->memory_ == NULL || picture->y == NULL ||
766      picture->u == NULL || picture->v == NULL) {
767    return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
768  }
769  if ((picture->colorspace & WEBP_CSP_ALPHA_BIT) && picture->a == NULL) {
770    return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
771  }
772  if ((picture->colorspace & WEBP_CSP_UV_MASK) != WEBP_YUV420) {
773    return WebPEncodingSetError(picture, VP8_ENC_ERROR_INVALID_CONFIGURATION);
774  }
775  // Allocate a new argb buffer (discarding the previous one).
776  if (!PictureAllocARGB(picture)) return 0;
777
778  // Convert
779  {
780    int y;
781    const int width = picture->width;
782    const int height = picture->height;
783    const int argb_stride = 4 * picture->argb_stride;
784    uint8_t* dst = (uint8_t*)picture->argb;
785    const uint8_t *cur_u = picture->u, *cur_v = picture->v, *cur_y = picture->y;
786    WebPUpsampleLinePairFunc upsample = WebPGetLinePairConverter(ALPHA_IS_LAST);
787
788    // First row, with replicated top samples.
789    upsample(NULL, cur_y, cur_u, cur_v, cur_u, cur_v, NULL, dst, width);
790    cur_y += picture->y_stride;
791    dst += argb_stride;
792    // Center rows.
793    for (y = 1; y + 1 < height; y += 2) {
794      const uint8_t* const top_u = cur_u;
795      const uint8_t* const top_v = cur_v;
796      cur_u += picture->uv_stride;
797      cur_v += picture->uv_stride;
798      upsample(cur_y, cur_y + picture->y_stride, top_u, top_v, cur_u, cur_v,
799               dst, dst + argb_stride, width);
800      cur_y += 2 * picture->y_stride;
801      dst += 2 * argb_stride;
802    }
803    // Last row (if needed), with replicated bottom samples.
804    if (height > 1 && !(height & 1)) {
805      upsample(cur_y, NULL, cur_u, cur_v, cur_u, cur_v, dst, NULL, width);
806    }
807    // Insert alpha values if needed, in replacement for the default 0xff ones.
808    if (picture->colorspace & WEBP_CSP_ALPHA_BIT) {
809      for (y = 0; y < height; ++y) {
810        uint32_t* const argb_dst = picture->argb + y * picture->argb_stride;
811        const uint8_t* const src = picture->a + y * picture->a_stride;
812        int x;
813        for (x = 0; x < width; ++x) {
814          argb_dst[x] = (argb_dst[x] & 0x00ffffffu) | ((uint32_t)src[x] << 24);
815        }
816      }
817    }
818  }
819  return 1;
820}
821
822int WebPPictureARGBToYUVA(WebPPicture* picture, WebPEncCSP colorspace) {
823  if (picture == NULL) return 0;
824  if (picture->argb == NULL) {
825    return WebPEncodingSetError(picture, VP8_ENC_ERROR_NULL_PARAMETER);
826  } else {
827    const uint8_t* const argb = (const uint8_t*)picture->argb;
828    const uint8_t* const r = ALPHA_IS_LAST ? argb + 2 : argb + 1;
829    const uint8_t* const g = ALPHA_IS_LAST ? argb + 1 : argb + 2;
830    const uint8_t* const b = ALPHA_IS_LAST ? argb + 0 : argb + 3;
831    const uint8_t* const a = ALPHA_IS_LAST ? argb + 3 : argb + 0;
832    // We work on a tmp copy of 'picture', because ImportYUVAFromRGBA()
833    // would be calling WebPPictureFree(picture) otherwise.
834    WebPPicture tmp = *picture;
835    PictureResetARGB(&tmp);  // reset ARGB buffer so that it's not free()'d.
836    tmp.use_argb = 0;
837    tmp.colorspace = colorspace & WEBP_CSP_UV_MASK;
838    if (!ImportYUVAFromRGBA(r, g, b, a, 4, 4 * picture->argb_stride, &tmp)) {
839      return WebPEncodingSetError(picture, VP8_ENC_ERROR_OUT_OF_MEMORY);
840    }
841    // Copy back the YUV specs into 'picture'.
842    tmp.argb = picture->argb;
843    tmp.argb_stride = picture->argb_stride;
844    tmp.memory_argb_ = picture->memory_argb_;
845    *picture = tmp;
846  }
847  return 1;
848}
849
850//------------------------------------------------------------------------------
851// Helper: clean up fully transparent area to help compressibility.
852
853#define SIZE 8
854#define SIZE2 (SIZE / 2)
855static int is_transparent_area(const uint8_t* ptr, int stride, int size) {
856  int y, x;
857  for (y = 0; y < size; ++y) {
858    for (x = 0; x < size; ++x) {
859      if (ptr[x]) {
860        return 0;
861      }
862    }
863    ptr += stride;
864  }
865  return 1;
866}
867
868static WEBP_INLINE void flatten(uint8_t* ptr, int v, int stride, int size) {
869  int y;
870  for (y = 0; y < size; ++y) {
871    memset(ptr, v, size);
872    ptr += stride;
873  }
874}
875
876void WebPCleanupTransparentArea(WebPPicture* pic) {
877  int x, y, w, h;
878  const uint8_t* a_ptr;
879  int values[3] = { 0 };
880
881  if (pic == NULL) return;
882
883  a_ptr = pic->a;
884  if (a_ptr == NULL) return;    // nothing to do
885
886  w = pic->width / SIZE;
887  h = pic->height / SIZE;
888  for (y = 0; y < h; ++y) {
889    int need_reset = 1;
890    for (x = 0; x < w; ++x) {
891      const int off_a = (y * pic->a_stride + x) * SIZE;
892      const int off_y = (y * pic->y_stride + x) * SIZE;
893      const int off_uv = (y * pic->uv_stride + x) * SIZE2;
894      if (is_transparent_area(a_ptr + off_a, pic->a_stride, SIZE)) {
895        if (need_reset) {
896          values[0] = pic->y[off_y];
897          values[1] = pic->u[off_uv];
898          values[2] = pic->v[off_uv];
899          need_reset = 0;
900        }
901        flatten(pic->y + off_y, values[0], pic->y_stride, SIZE);
902        flatten(pic->u + off_uv, values[1], pic->uv_stride, SIZE2);
903        flatten(pic->v + off_uv, values[2], pic->uv_stride, SIZE2);
904      } else {
905        need_reset = 1;
906      }
907    }
908    // ignore the left-overs on right/bottom
909  }
910}
911
912#undef SIZE
913#undef SIZE2
914
915//------------------------------------------------------------------------------
916// local-min distortion
917//
918// For every pixel in the *reference* picture, we search for the local best
919// match in the compressed image. This is not a symmetrical measure.
920
921// search radius. Shouldn't be too large.
922#define RADIUS 2
923
924static float AccumulateLSIM(const uint8_t* src, int src_stride,
925                            const uint8_t* ref, int ref_stride,
926                            int w, int h) {
927  int x, y;
928  double total_sse = 0.;
929  for (y = 0; y < h; ++y) {
930    const int y_0 = (y - RADIUS < 0) ? 0 : y - RADIUS;
931    const int y_1 = (y + RADIUS + 1 >= h) ? h : y + RADIUS + 1;
932    for (x = 0; x < w; ++x) {
933      const int x_0 = (x - RADIUS < 0) ? 0 : x - RADIUS;
934      const int x_1 = (x + RADIUS + 1 >= w) ? w : x + RADIUS + 1;
935      double best_sse = 255. * 255.;
936      const double value = (double)ref[y * ref_stride + x];
937      int i, j;
938      for (j = y_0; j < y_1; ++j) {
939        const uint8_t* s = src + j * src_stride;
940        for (i = x_0; i < x_1; ++i) {
941          const double sse = (double)(s[i] - value) * (s[i] - value);
942          if (sse < best_sse) best_sse = sse;
943        }
944      }
945      total_sse += best_sse;
946    }
947  }
948  return (float)total_sse;
949}
950#undef RADIUS
951
952//------------------------------------------------------------------------------
953// Distortion
954
955// Max value returned in case of exact similarity.
956static const double kMinDistortion_dB = 99.;
957static float GetPSNR(const double v) {
958  return (float)((v > 0.) ? -4.3429448 * log(v / (255 * 255.))
959                          : kMinDistortion_dB);
960}
961
962int WebPPictureDistortion(const WebPPicture* src, const WebPPicture* ref,
963                          int type, float result[5]) {
964  DistoStats stats[5];
965  int has_alpha;
966  int uv_w, uv_h;
967
968  if (src == NULL || ref == NULL ||
969      src->width != ref->width || src->height != ref->height ||
970      src->y == NULL || ref->y == NULL ||
971      src->u == NULL || ref->u == NULL ||
972      src->v == NULL || ref->v == NULL ||
973      result == NULL) {
974    return 0;
975  }
976  // TODO(skal): provide distortion for ARGB too.
977  if (src->use_argb == 1 || src->use_argb != ref->use_argb) {
978    return 0;
979  }
980
981  has_alpha = !!(src->colorspace & WEBP_CSP_ALPHA_BIT);
982  if (has_alpha != !!(ref->colorspace & WEBP_CSP_ALPHA_BIT) ||
983      (has_alpha && (src->a == NULL || ref->a == NULL))) {
984    return 0;
985  }
986
987  memset(stats, 0, sizeof(stats));
988
989  uv_w = HALVE(src->width);
990  uv_h = HALVE(src->height);
991  if (type >= 2) {
992    float sse[4];
993    sse[0] = AccumulateLSIM(src->y, src->y_stride,
994                            ref->y, ref->y_stride, src->width, src->height);
995    sse[1] = AccumulateLSIM(src->u, src->uv_stride,
996                            ref->u, ref->uv_stride, uv_w, uv_h);
997    sse[2] = AccumulateLSIM(src->v, src->uv_stride,
998                            ref->v, ref->uv_stride, uv_w, uv_h);
999    sse[3] = has_alpha ? AccumulateLSIM(src->a, src->a_stride,
1000                                        ref->a, ref->a_stride,
1001                                        src->width, src->height)
1002                       : 0.f;
1003    result[0] = GetPSNR(sse[0] / (src->width * src->height));
1004    result[1] = GetPSNR(sse[1] / (uv_w * uv_h));
1005    result[2] = GetPSNR(sse[2] / (uv_w * uv_h));
1006    result[3] = GetPSNR(sse[3] / (src->width * src->height));
1007    {
1008      double total_sse = sse[0] + sse[1] + sse[2];
1009      int total_pixels = src->width * src->height + 2 * uv_w * uv_h;
1010      if (has_alpha) {
1011        total_pixels += src->width * src->height;
1012        total_sse += sse[3];
1013      }
1014      result[4] = GetPSNR(total_sse / total_pixels);
1015    }
1016  } else {
1017    int c;
1018    VP8SSIMAccumulatePlane(src->y, src->y_stride,
1019                           ref->y, ref->y_stride,
1020                           src->width, src->height, &stats[0]);
1021    VP8SSIMAccumulatePlane(src->u, src->uv_stride,
1022                           ref->u, ref->uv_stride,
1023                           uv_w, uv_h, &stats[1]);
1024    VP8SSIMAccumulatePlane(src->v, src->uv_stride,
1025                           ref->v, ref->uv_stride,
1026                           uv_w, uv_h, &stats[2]);
1027    if (has_alpha) {
1028      VP8SSIMAccumulatePlane(src->a, src->a_stride,
1029                             ref->a, ref->a_stride,
1030                             src->width, src->height, &stats[3]);
1031    }
1032    for (c = 0; c <= 4; ++c) {
1033      if (type == 1) {
1034        const double v = VP8SSIMGet(&stats[c]);
1035        result[c] = (float)((v < 1.) ? -10.0 * log10(1. - v)
1036                                     : kMinDistortion_dB);
1037      } else {
1038        const double v = VP8SSIMGetSquaredError(&stats[c]);
1039        result[c] = GetPSNR(v);
1040      }
1041      // Accumulate forward
1042      if (c < 4) VP8SSIMAddStats(&stats[c], &stats[4]);
1043    }
1044  }
1045  return 1;
1046}
1047
1048//------------------------------------------------------------------------------
1049// Simplest high-level calls:
1050
1051typedef int (*Importer)(WebPPicture* const, const uint8_t* const, int);
1052
1053static size_t Encode(const uint8_t* rgba, int width, int height, int stride,
1054                     Importer import, float quality_factor, int lossless,
1055                     uint8_t** output) {
1056  WebPPicture pic;
1057  WebPConfig config;
1058  WebPMemoryWriter wrt;
1059  int ok;
1060
1061  if (!WebPConfigPreset(&config, WEBP_PRESET_DEFAULT, quality_factor) ||
1062      !WebPPictureInit(&pic)) {
1063    return 0;  // shouldn't happen, except if system installation is broken
1064  }
1065
1066  config.lossless = !!lossless;
1067  pic.use_argb = !!lossless;
1068  pic.width = width;
1069  pic.height = height;
1070  pic.writer = WebPMemoryWrite;
1071  pic.custom_ptr = &wrt;
1072  WebPMemoryWriterInit(&wrt);
1073
1074  ok = import(&pic, rgba, stride) && WebPEncode(&config, &pic);
1075  WebPPictureFree(&pic);
1076  if (!ok) {
1077    free(wrt.mem);
1078    *output = NULL;
1079    return 0;
1080  }
1081  *output = wrt.mem;
1082  return wrt.size;
1083}
1084
1085#define ENCODE_FUNC(NAME, IMPORTER)                                     \
1086size_t NAME(const uint8_t* in, int w, int h, int bps, float q,          \
1087            uint8_t** out) {                                            \
1088  return Encode(in, w, h, bps, IMPORTER, q, 0, out);                    \
1089}
1090
1091ENCODE_FUNC(WebPEncodeRGB, WebPPictureImportRGB);
1092ENCODE_FUNC(WebPEncodeBGR, WebPPictureImportBGR);
1093ENCODE_FUNC(WebPEncodeRGBA, WebPPictureImportRGBA);
1094ENCODE_FUNC(WebPEncodeBGRA, WebPPictureImportBGRA);
1095
1096#undef ENCODE_FUNC
1097
1098#define LOSSLESS_DEFAULT_QUALITY 70.
1099#define LOSSLESS_ENCODE_FUNC(NAME, IMPORTER)                                 \
1100size_t NAME(const uint8_t* in, int w, int h, int bps, uint8_t** out) {       \
1101  return Encode(in, w, h, bps, IMPORTER, LOSSLESS_DEFAULT_QUALITY, 1, out);  \
1102}
1103
1104LOSSLESS_ENCODE_FUNC(WebPEncodeLosslessRGB, WebPPictureImportRGB);
1105LOSSLESS_ENCODE_FUNC(WebPEncodeLosslessBGR, WebPPictureImportBGR);
1106LOSSLESS_ENCODE_FUNC(WebPEncodeLosslessRGBA, WebPPictureImportRGBA);
1107LOSSLESS_ENCODE_FUNC(WebPEncodeLosslessBGRA, WebPPictureImportBGRA);
1108
1109#undef LOSSLESS_ENCODE_FUNC
1110
1111//------------------------------------------------------------------------------
1112
1113#if defined(__cplusplus) || defined(c_plusplus)
1114}    // extern "C"
1115#endif
1116