Coverage Report

Created: 2025-08-12 07:37

/src/libwebp/sharpyuv/sharpyuv.c
Line
Count
Source (jump to first uncovered line)
1
// Copyright 2022 Google Inc. All Rights Reserved.
2
//
3
// Use of this source code is governed by a BSD-style license
4
// that can be found in the COPYING file in the root of the source
5
// tree. An additional intellectual property rights grant can be found
6
// in the file PATENTS. All contributing project authors may
7
// be found in the AUTHORS file in the root of the source tree.
8
// -----------------------------------------------------------------------------
9
//
10
// Sharp RGB to YUV conversion.
11
//
12
// Author: Skal (pascal.massimino@gmail.com)
13
14
#include "sharpyuv/sharpyuv.h"
15
16
#include <assert.h>
17
#include <limits.h>
18
#include <stddef.h>
19
#include <stdlib.h>
20
#include <string.h>
21
22
#include "sharpyuv/sharpyuv_cpu.h"
23
#include "sharpyuv/sharpyuv_dsp.h"
24
#include "sharpyuv/sharpyuv_gamma.h"
25
#include "src/webp/types.h"
26
27
//------------------------------------------------------------------------------
28
29
0
// Returns the value of the SHARPYUV_VERSION macro.
int SharpYuvGetVersion(void) {
  const int version = SHARPYUV_VERSION;
  return version;
}
30
31
//------------------------------------------------------------------------------
32
// Sharp RGB->YUV conversion
33
34
// Number of fractional bits used by the fixed-point RGB->YUV arithmetic.
#define YUV_FIX 16
// One half expressed with YUV_FIX fractional bits; used as a rounding term.
static const int kYuvHalf = 1 << (YUV_FIX - 1);

// Upper bound on the number of refinement passes.
static const int kNumIterations = 4;

// Max bit depth so that intermediate calculations fit in 16 bits.
static const int kMaxBitDepth = 14;
41
42
// Returns the precision shift to use based on the input rgb_bit_depth.
43
0
static int GetPrecisionShift(int rgb_bit_depth) {
44
  // Try to add 2 bits of precision if it fits in kMaxBitDepth. Otherwise remove
45
  // bits if needed.
46
0
  return ((rgb_bit_depth + 2) <= kMaxBitDepth) ? 2
47
0
                                               : (kMaxBitDepth - rgb_bit_depth);
48
0
}
49
50
// Signed 16-bit type with extra precision, used for UV.
typedef int16_t fixed_t;
// Unsigned 16-bit type with extra precision, used for W.
typedef uint16_t fixed_y_t;
52
53
//------------------------------------------------------------------------------
54
55
0
// Clamps 'v' to [0, 255] and returns it as an 8-bit sample.
// The parameter is a plain int: callers pass int results, and taking a 16-bit
// type here would narrow out-of-range values *before* the clamp (e.g. 65536
// would wrap to 0 instead of saturating to 255).
static uint8_t clip_8b(int v) {
  // Fast path: no bit set outside the low 8 bits means 0 <= v <= 255.
  return (!(v & ~0xff)) ? (uint8_t)v : (v < 0) ? 0u : 255u;
}
58
59
0
// Clamps 'v' to [0, max] and returns it as a 16-bit sample.
// 'v' is a plain int so that values outside the int16_t range saturate
// instead of being narrowed (and possibly wrapped) before the comparison.
static uint16_t clip(int v, int max) {
  if (v < 0) return 0;
  if (v > max) return (uint16_t)max;
  return (uint16_t)v;
}
62
63
0
static fixed_y_t clip_bit_depth(int y, int bit_depth) {
64
0
  const int max = (1 << bit_depth) - 1;
65
0
  return (!(y & ~max)) ? (fixed_y_t)y : (y < 0) ? 0 : max;
66
0
}
67
68
//------------------------------------------------------------------------------
69
70
0
static int RGBToGray(int64_t r, int64_t g, int64_t b) {
71
0
  const int64_t luma = 13933 * r + 46871 * g + 4732 * b + kYuvHalf;
72
0
  return (int)(luma >> YUV_FIX);
73
0
}
74
75
static uint32_t ScaleDown(uint16_t a, uint16_t b, uint16_t c, uint16_t d,
76
                          int rgb_bit_depth,
77
0
                          SharpYuvTransferFunctionType transfer_type) {
78
0
  const int bit_depth = rgb_bit_depth + GetPrecisionShift(rgb_bit_depth);
79
0
  const uint32_t A = SharpYuvGammaToLinear(a, bit_depth, transfer_type);
80
0
  const uint32_t B = SharpYuvGammaToLinear(b, bit_depth, transfer_type);
81
0
  const uint32_t C = SharpYuvGammaToLinear(c, bit_depth, transfer_type);
82
0
  const uint32_t D = SharpYuvGammaToLinear(d, bit_depth, transfer_type);
83
0
  return SharpYuvLinearToGamma((A + B + C + D + 2) >> 2, bit_depth,
84
0
                               transfer_type);
85
0
}
86
87
static WEBP_INLINE void UpdateW(const fixed_y_t* src, fixed_y_t* dst, int w,
88
                                int rgb_bit_depth,
89
0
                                SharpYuvTransferFunctionType transfer_type) {
90
0
  const int bit_depth = rgb_bit_depth + GetPrecisionShift(rgb_bit_depth);
91
0
  int i = 0;
92
0
  do {
93
0
    const uint32_t R =
94
0
        SharpYuvGammaToLinear(src[0 * w + i], bit_depth, transfer_type);
95
0
    const uint32_t G =
96
0
        SharpYuvGammaToLinear(src[1 * w + i], bit_depth, transfer_type);
97
0
    const uint32_t B =
98
0
        SharpYuvGammaToLinear(src[2 * w + i], bit_depth, transfer_type);
99
0
    const uint32_t Y = RGBToGray(R, G, B);
100
0
    dst[i] = (fixed_y_t)SharpYuvLinearToGamma(Y, bit_depth, transfer_type);
101
0
  } while (++i < w);
102
0
}
103
104
static void UpdateChroma(const fixed_y_t* src1, const fixed_y_t* src2,
105
                         fixed_t* dst, int uv_w, int rgb_bit_depth,
106
0
                         SharpYuvTransferFunctionType transfer_type) {
107
0
  int i = 0;
108
0
  do {
109
0
    const int r =
110
0
        ScaleDown(src1[0 * uv_w + 0], src1[0 * uv_w + 1], src2[0 * uv_w + 0],
111
0
                  src2[0 * uv_w + 1], rgb_bit_depth, transfer_type);
112
0
    const int g =
113
0
        ScaleDown(src1[2 * uv_w + 0], src1[2 * uv_w + 1], src2[2 * uv_w + 0],
114
0
                  src2[2 * uv_w + 1], rgb_bit_depth, transfer_type);
115
0
    const int b =
116
0
        ScaleDown(src1[4 * uv_w + 0], src1[4 * uv_w + 1], src2[4 * uv_w + 0],
117
0
                  src2[4 * uv_w + 1], rgb_bit_depth, transfer_type);
118
0
    const int W = RGBToGray(r, g, b);
119
0
    dst[0 * uv_w] = (fixed_t)(r - W);
120
0
    dst[1 * uv_w] = (fixed_t)(g - W);
121
0
    dst[2 * uv_w] = (fixed_t)(b - W);
122
0
    dst += 1;
123
0
    src1 += 2;
124
0
    src2 += 2;
125
0
  } while (++i < uv_w);
126
0
}
127
128
0
// Writes RGBToGray() of each pixel into y[0..w-1].
// 'rgb' holds three consecutive planes of 'w' entries (R, then G, then B).
static void StoreGray(const fixed_y_t* rgb, fixed_y_t* y, int w) {
  const fixed_y_t* const r_row = rgb + 0 * w;
  const fixed_y_t* const g_row = rgb + 1 * w;
  const fixed_y_t* const b_row = rgb + 2 * w;
  int x = 0;
  assert(w > 0);
  do {
    y[x] = RGBToGray(r_row[x], g_row[x], b_row[x]);
    ++x;
  } while (x < w);
}
135
136
//------------------------------------------------------------------------------
137
138
0
// Blends A and B with weights 3/4 and 1/4 (rounded), adds W0, and clamps the
// result to 'bit_depth' bits.
static WEBP_INLINE fixed_y_t Filter2(int A, int B, int W0, int bit_depth) {
  const int blended = (3 * A + B + 2) >> 2;
  const int sum = blended + W0;
  return clip_bit_depth(sum, bit_depth);
}
142
143
//------------------------------------------------------------------------------
144
145
0
// Scales 'v' by 2^shift: up when 'shift' is non-negative, down (via right
// shift by -shift) when it is negative.
static WEBP_INLINE int Shift(int v, int shift) {
  if (shift >= 0) {
    // Multiply instead of using '<<': left-shifting a negative value is
    // undefined behavior in C, while the product is well defined as long as
    // it fits in an int. For non-negative 'v' the result is unchanged.
    return v * (1 << shift);
  }
  // Right shift of a negative value is implementation-defined (not
  // undefined); kept as in the original.
  return v >> -shift;
}
148
149
static void ImportOneRow(const uint8_t* const r_ptr, const uint8_t* const g_ptr,
150
                         const uint8_t* const b_ptr, int rgb_step,
151
                         int rgb_bit_depth, int pic_width,
152
0
                         fixed_y_t* const dst) {
153
  // Convert the rgb_step from a number of bytes to a number of uint8_t or
154
  // uint16_t values depending the bit depth.
155
0
  const int step = (rgb_bit_depth > 8) ? rgb_step / 2 : rgb_step;
156
0
  int i = 0;
157
0
  const int w = (pic_width + 1) & ~1;
158
0
  do {
159
0
    const int off = i * step;
160
0
    const int shift = GetPrecisionShift(rgb_bit_depth);
161
0
    if (rgb_bit_depth == 8) {
162
0
      dst[i + 0 * w] = Shift(r_ptr[off], shift);
163
0
      dst[i + 1 * w] = Shift(g_ptr[off], shift);
164
0
      dst[i + 2 * w] = Shift(b_ptr[off], shift);
165
0
    } else {
166
0
      dst[i + 0 * w] = Shift(((uint16_t*)r_ptr)[off], shift);
167
0
      dst[i + 1 * w] = Shift(((uint16_t*)g_ptr)[off], shift);
168
0
      dst[i + 2 * w] = Shift(((uint16_t*)b_ptr)[off], shift);
169
0
    }
170
0
  } while (++i < pic_width);
171
0
  if (pic_width & 1) {  // replicate rightmost pixel
172
0
    dst[pic_width + 0 * w] = dst[pic_width + 0 * w - 1];
173
0
    dst[pic_width + 1 * w] = dst[pic_width + 1 * w - 1];
174
0
    dst[pic_width + 2 * w] = dst[pic_width + 2 * w - 1];
175
0
  }
176
0
}
177
178
// Reconstructs two full-resolution rows of R/G/B samples (out1 and out2,
// three planes of 'w' entries each) from the W values in 'best_y' (two rows
// of 'w' entries) and three rows of half-width chroma: 'cur_uv' blended with
// 'prev_uv' for out1 and with 'next_uv' for out2. The same W values are used
// for all three channels.
static void InterpolateTwoRows(const fixed_y_t* const best_y,
                               const fixed_t* prev_uv, const fixed_t* cur_uv,
                               const fixed_t* next_uv, int w, fixed_y_t* out1,
                               fixed_y_t* out2, int rgb_bit_depth) {
  const int uv_w = w >> 1;
  const int len = (w - 1) >> 1;  // length to filter
  const int bit_depth = rgb_bit_depth + GetPrecisionShift(rgb_bit_depth);
  const int w_is_even = !(w & 1);
  const fixed_y_t* const y_top = best_y;
  const fixed_y_t* const y_bot = best_y + w;
  int channel;
  // process each R/G/B segments in turn
  for (channel = 0; channel < 3; ++channel) {
    // special boundary case for i==0
    out1[0] = Filter2(cur_uv[0], prev_uv[0], y_top[0], bit_depth);
    out2[0] = Filter2(cur_uv[0], next_uv[0], y_bot[0], bit_depth);

    SharpYuvFilterRow(cur_uv, prev_uv, len, y_top + 1, out1 + 1, bit_depth);
    SharpYuvFilterRow(cur_uv, next_uv, len, y_bot + 1, out2 + 1, bit_depth);

    // special boundary case for i == w - 1 when w is even
    if (w_is_even) {
      const int last_uv = uv_w - 1;
      const int last = w - 1;
      out1[last] =
          Filter2(cur_uv[last_uv], prev_uv[last_uv], y_top[last], bit_depth);
      out2[last] =
          Filter2(cur_uv[last_uv], next_uv[last_uv], y_bot[last], bit_depth);
    }
    out1 += w;
    out2 += w;
    prev_uv += uv_w;
    cur_uv += uv_w;
    next_uv += uv_w;
  }
}
210
211
static WEBP_INLINE int RGBToYUVComponent(int r, int g, int b,
212
0
                                         const int coeffs[4], int sfix) {
213
0
  const int srounder = 1 << (YUV_FIX + sfix - 1);
214
0
  const int luma =
215
0
      coeffs[0] * r + coeffs[1] * g + coeffs[2] * b + coeffs[3] + srounder;
216
0
  return (luma >> (YUV_FIX + sfix));
217
0
}
218
219
static int ConvertWRGBToYUV(const fixed_y_t* best_y, const fixed_t* best_uv,
220
                            uint8_t* y_ptr, int y_stride, uint8_t* u_ptr,
221
                            int u_stride, uint8_t* v_ptr, int v_stride,
222
                            int rgb_bit_depth, int yuv_bit_depth, int width,
223
                            int height,
224
0
                            const SharpYuvConversionMatrix* yuv_matrix) {
225
0
  int i, j;
226
0
  const fixed_t* const best_uv_base = best_uv;
227
0
  const int w = (width + 1) & ~1;
228
0
  const int h = (height + 1) & ~1;
229
0
  const int uv_w = w >> 1;
230
0
  const int uv_h = h >> 1;
231
0
  const int sfix = GetPrecisionShift(rgb_bit_depth);
232
0
  const int yuv_max = (1 << yuv_bit_depth) - 1;
233
234
0
  best_uv = best_uv_base;
235
0
  j = 0;
236
0
  do {
237
0
    i = 0;
238
0
    do {
239
0
      const int off = (i >> 1);
240
0
      const int W = best_y[i];
241
0
      const int r = best_uv[off + 0 * uv_w] + W;
242
0
      const int g = best_uv[off + 1 * uv_w] + W;
243
0
      const int b = best_uv[off + 2 * uv_w] + W;
244
0
      const int y = RGBToYUVComponent(r, g, b, yuv_matrix->rgb_to_y, sfix);
245
0
      if (yuv_bit_depth <= 8) {
246
0
        y_ptr[i] = clip_8b(y);
247
0
      } else {
248
0
        ((uint16_t*)y_ptr)[i] = clip(y, yuv_max);
249
0
      }
250
0
    } while (++i < width);
251
0
    best_y += w;
252
0
    best_uv += (j & 1) * 3 * uv_w;
253
0
    y_ptr += y_stride;
254
0
  } while (++j < height);
255
256
0
  best_uv = best_uv_base;
257
0
  j = 0;
258
0
  do {
259
0
    i = 0;
260
0
    do {
261
      // Note r, g and b values here are off by W, but a constant offset on all
262
      // 3 components doesn't change the value of u and v with a YCbCr matrix.
263
0
      const int r = best_uv[i + 0 * uv_w];
264
0
      const int g = best_uv[i + 1 * uv_w];
265
0
      const int b = best_uv[i + 2 * uv_w];
266
0
      const int u = RGBToYUVComponent(r, g, b, yuv_matrix->rgb_to_u, sfix);
267
0
      const int v = RGBToYUVComponent(r, g, b, yuv_matrix->rgb_to_v, sfix);
268
0
      if (yuv_bit_depth <= 8) {
269
0
        u_ptr[i] = clip_8b(u);
270
0
        v_ptr[i] = clip_8b(v);
271
0
      } else {
272
0
        ((uint16_t*)u_ptr)[i] = clip(u, yuv_max);
273
0
        ((uint16_t*)v_ptr)[i] = clip(v, yuv_max);
274
0
      }
275
0
    } while (++i < uv_w);
276
0
    best_uv += 3 * uv_w;
277
0
    u_ptr += u_stride;
278
0
    v_ptr += v_stride;
279
0
  } while (++j < uv_h);
280
0
  return 1;
281
0
}
282
283
//------------------------------------------------------------------------------
284
// Main function
285
286
0
// Allocates nmemb * size bytes with malloc().
// Returns NULL if the product overflows 64 bits, if it does not fit in a
// size_t, or if malloc() fails. The caller owns the returned buffer and must
// release it with free().
static void* SafeMalloc(uint64_t nmemb, size_t size) {
  uint64_t total_size;
  // Reject products that would wrap around in uint64_t; without this check a
  // huge request could silently turn into a small allocation.
  if (size != 0 && nmemb > ~(uint64_t)0 / size) return NULL;
  total_size = nmemb * (uint64_t)size;
  // Reject sizes not representable as size_t (e.g. on 32-bit targets).
  if (total_size != (size_t)total_size) return NULL;
  return malloc((size_t)total_size);
}
291
292
static int DoSharpArgbToYuv(const uint8_t* r_ptr, const uint8_t* g_ptr,
293
                            const uint8_t* b_ptr, int rgb_step, int rgb_stride,
294
                            int rgb_bit_depth, uint8_t* y_ptr, int y_stride,
295
                            uint8_t* u_ptr, int u_stride, uint8_t* v_ptr,
296
                            int v_stride, int yuv_bit_depth, int width,
297
                            int height,
298
                            const SharpYuvConversionMatrix* yuv_matrix,
299
0
                            SharpYuvTransferFunctionType transfer_type) {
300
  // we expand the right/bottom border if needed
301
0
  const int w = (width + 1) & ~1;
302
0
  const int h = (height + 1) & ~1;
303
0
  const int uv_w = w >> 1;
304
0
  const int uv_h = h >> 1;
305
0
  const int y_bit_depth = rgb_bit_depth + GetPrecisionShift(rgb_bit_depth);
306
0
  uint64_t prev_diff_y_sum = ~0;
307
0
  int j, iter;
308
309
0
  const uint64_t tmp_buffer_size = (uint64_t)w * 3 * 2;
310
0
  const uint64_t best_y_base_size = (uint64_t)w * h;
311
0
  const uint64_t target_y_base_size = (uint64_t)w * h;
312
0
  const uint64_t best_rgb_y_size = (uint64_t)w * 2;
313
0
  const uint64_t best_uv_base_size = (uint64_t)uv_w * 3 * uv_h;
314
0
  const uint64_t target_uv_base_size = (uint64_t)uv_w * 3 * uv_h;
315
0
  const uint64_t best_rgb_uv_size = (uint64_t)uv_w * 3;
316
0
  fixed_y_t* const tmp_buffer = (fixed_y_t*)SafeMalloc(
317
0
      (tmp_buffer_size + best_y_base_size + target_y_base_size +
318
0
       best_rgb_y_size) +
319
0
          (best_uv_base_size + target_uv_base_size + best_rgb_uv_size),
320
0
      sizeof(*tmp_buffer));
321
0
  fixed_y_t *best_y_base, *target_y_base, *best_rgb_y;
322
0
  fixed_t *best_uv_base, *target_uv_base, *best_rgb_uv;
323
0
  fixed_y_t *best_y, *target_y;
324
0
  fixed_t *best_uv, *target_uv;
325
0
  const uint64_t diff_y_threshold = (uint64_t)(3.0 * w * h);
326
0
  int ok;
327
0
  assert(w > 0);
328
0
  assert(h > 0);
329
0
  assert(sizeof(fixed_y_t) == sizeof(fixed_t));
330
331
0
  if (tmp_buffer == NULL) {
332
0
    ok = 0;
333
0
    goto End;
334
0
  }
335
0
  best_y_base = tmp_buffer + tmp_buffer_size;
336
0
  target_y_base = best_y_base + best_y_base_size;
337
0
  best_rgb_y = target_y_base + target_y_base_size;
338
0
  best_uv_base = (fixed_t*)(best_rgb_y + best_rgb_y_size);
339
0
  target_uv_base = best_uv_base + best_uv_base_size;
340
0
  best_rgb_uv = target_uv_base + target_uv_base_size;
341
0
  best_y = best_y_base;
342
0
  target_y = target_y_base;
343
0
  best_uv = best_uv_base;
344
0
  target_uv = target_uv_base;
345
346
  // Import RGB samples to W/RGB representation.
347
0
  for (j = 0; j < height; j += 2) {
348
0
    const int is_last_row = (j == height - 1);
349
0
    fixed_y_t* const src1 = tmp_buffer + 0 * w;
350
0
    fixed_y_t* const src2 = tmp_buffer + 3 * w;
351
352
    // prepare two rows of input
353
0
    ImportOneRow(r_ptr, g_ptr, b_ptr, rgb_step, rgb_bit_depth, width, src1);
354
0
    if (!is_last_row) {
355
0
      ImportOneRow(r_ptr + rgb_stride, g_ptr + rgb_stride, b_ptr + rgb_stride,
356
0
                   rgb_step, rgb_bit_depth, width, src2);
357
0
    } else {
358
0
      memcpy(src2, src1, 3 * w * sizeof(*src2));
359
0
    }
360
0
    StoreGray(src1, best_y + 0, w);
361
0
    StoreGray(src2, best_y + w, w);
362
363
0
    UpdateW(src1, target_y, w, rgb_bit_depth, transfer_type);
364
0
    UpdateW(src2, target_y + w, w, rgb_bit_depth, transfer_type);
365
0
    UpdateChroma(src1, src2, target_uv, uv_w, rgb_bit_depth, transfer_type);
366
0
    memcpy(best_uv, target_uv, 3 * uv_w * sizeof(*best_uv));
367
0
    best_y += 2 * w;
368
0
    best_uv += 3 * uv_w;
369
0
    target_y += 2 * w;
370
0
    target_uv += 3 * uv_w;
371
0
    r_ptr += 2 * rgb_stride;
372
0
    g_ptr += 2 * rgb_stride;
373
0
    b_ptr += 2 * rgb_stride;
374
0
  }
375
376
  // Iterate and resolve clipping conflicts.
377
0
  for (iter = 0; iter < kNumIterations; ++iter) {
378
0
    const fixed_t* cur_uv = best_uv_base;
379
0
    const fixed_t* prev_uv = best_uv_base;
380
0
    uint64_t diff_y_sum = 0;
381
382
0
    best_y = best_y_base;
383
0
    best_uv = best_uv_base;
384
0
    target_y = target_y_base;
385
0
    target_uv = target_uv_base;
386
0
    j = 0;
387
0
    do {
388
0
      fixed_y_t* const src1 = tmp_buffer + 0 * w;
389
0
      fixed_y_t* const src2 = tmp_buffer + 3 * w;
390
0
      {
391
0
        const fixed_t* const next_uv = cur_uv + ((j < h - 2) ? 3 * uv_w : 0);
392
0
        InterpolateTwoRows(best_y, prev_uv, cur_uv, next_uv, w, src1, src2,
393
0
                           rgb_bit_depth);
394
0
        prev_uv = cur_uv;
395
0
        cur_uv = next_uv;
396
0
      }
397
398
0
      UpdateW(src1, best_rgb_y + 0 * w, w, rgb_bit_depth, transfer_type);
399
0
      UpdateW(src2, best_rgb_y + 1 * w, w, rgb_bit_depth, transfer_type);
400
0
      UpdateChroma(src1, src2, best_rgb_uv, uv_w, rgb_bit_depth, transfer_type);
401
402
      // update two rows of Y and one row of RGB
403
0
      diff_y_sum +=
404
0
          SharpYuvUpdateY(target_y, best_rgb_y, best_y, 2 * w, y_bit_depth);
405
0
      SharpYuvUpdateRGB(target_uv, best_rgb_uv, best_uv, 3 * uv_w);
406
407
0
      best_y += 2 * w;
408
0
      best_uv += 3 * uv_w;
409
0
      target_y += 2 * w;
410
0
      target_uv += 3 * uv_w;
411
0
      j += 2;
412
0
    } while (j < h);
413
    // test exit condition
414
0
    if (iter > 0) {
415
0
      if (diff_y_sum < diff_y_threshold) break;
416
0
      if (diff_y_sum > prev_diff_y_sum) break;
417
0
    }
418
0
    prev_diff_y_sum = diff_y_sum;
419
0
  }
420
421
  // final reconstruction
422
0
  ok = ConvertWRGBToYUV(best_y_base, best_uv_base, y_ptr, y_stride, u_ptr,
423
0
                        u_stride, v_ptr, v_stride, rgb_bit_depth, yuv_bit_depth,
424
0
                        width, height, yuv_matrix);
425
426
0
End:
427
0
  free(tmp_buffer);
428
0
  return ok;
429
0
}
430
431
#if !defined(WEBP_USE_THREAD) || defined(_WIN32)
// No pthread-based locking in this configuration: LOCK_ACCESS is an empty
// statement and UNLOCK_ACCESS_AND_RETURN is a plain return.
#define LOCK_ACCESS \
  do {              \
  } while (0)
#define UNLOCK_ACCESS_AND_RETURN return
#else  // defined(WEBP_USE_THREAD) && !defined(_WIN32)
#include <pthread.h>  // NOLINT

// Declares a function-local static mutex and locks it; returns from the
// enclosing (void) function if pthread_mutex_lock() reports an error.
#define LOCK_ACCESS                                                 \
  static pthread_mutex_t sharpyuv_lock = PTHREAD_MUTEX_INITIALIZER; \
  if (pthread_mutex_lock(&sharpyuv_lock)) return
// Unlocks the mutex declared by LOCK_ACCESS, then returns.
#define UNLOCK_ACCESS_AND_RETURN                \
  do {                                          \
    (void)pthread_mutex_unlock(&sharpyuv_lock); \
    return;                                     \
  } while (0)
#endif  // !defined(WEBP_USE_THREAD) || defined(_WIN32)
448
449
// Hidden exported init function.
450
// By default SharpYuvConvert calls it with SharpYuvGetCPUInfo. If needed,
451
// users can declare it as extern and call it with an alternate VP8CPUInfo
452
// function.
453
extern VP8CPUInfo SharpYuvGetCPUInfo;
454
SHARPYUV_EXTERN void SharpYuvInit(VP8CPUInfo cpu_info_func);
455
0
void SharpYuvInit(VP8CPUInfo cpu_info_func) {
456
0
  static volatile VP8CPUInfo sharpyuv_last_cpuinfo_used =
457
0
      (VP8CPUInfo)&sharpyuv_last_cpuinfo_used;
458
0
  LOCK_ACCESS;
459
  // Only update SharpYuvGetCPUInfo when called from external code to avoid a
460
  // race on reading the value in SharpYuvConvert().
461
0
  if (cpu_info_func != (VP8CPUInfo)&SharpYuvGetCPUInfo) {
462
0
    SharpYuvGetCPUInfo = cpu_info_func;
463
0
  }
464
0
  if (sharpyuv_last_cpuinfo_used == SharpYuvGetCPUInfo) {
465
0
    UNLOCK_ACCESS_AND_RETURN;
466
0
  }
467
468
0
  SharpYuvInitDsp();
469
0
  SharpYuvInitGammaTables();
470
471
0
  sharpyuv_last_cpuinfo_used = SharpYuvGetCPUInfo;
472
0
  UNLOCK_ACCESS_AND_RETURN;
473
0
}
474
475
int SharpYuvConvert(const void* r_ptr, const void* g_ptr, const void* b_ptr,
476
                    int rgb_step, int rgb_stride, int rgb_bit_depth,
477
                    void* y_ptr, int y_stride, void* u_ptr, int u_stride,
478
                    void* v_ptr, int v_stride, int yuv_bit_depth, int width,
479
0
                    int height, const SharpYuvConversionMatrix* yuv_matrix) {
480
0
  SharpYuvOptions options;
481
0
  options.yuv_matrix = yuv_matrix;
482
0
  options.transfer_type = kSharpYuvTransferFunctionSrgb;
483
0
  return SharpYuvConvertWithOptions(
484
0
      r_ptr, g_ptr, b_ptr, rgb_step, rgb_stride, rgb_bit_depth, y_ptr, y_stride,
485
0
      u_ptr, u_stride, v_ptr, v_stride, yuv_bit_depth, width, height, &options);
486
0
}
487
488
int SharpYuvOptionsInitInternal(const SharpYuvConversionMatrix* yuv_matrix,
489
0
                                SharpYuvOptions* options, int version) {
490
0
  const int major = (version >> 24);
491
0
  const int minor = (version >> 16) & 0xff;
492
0
  if (options == NULL || yuv_matrix == NULL ||
493
0
      (major == SHARPYUV_VERSION_MAJOR && major == 0 &&
494
0
       minor != SHARPYUV_VERSION_MINOR) ||
495
0
      (major != SHARPYUV_VERSION_MAJOR)) {
496
0
    return 0;
497
0
  }
498
0
  options->yuv_matrix = yuv_matrix;
499
0
  options->transfer_type = kSharpYuvTransferFunctionSrgb;
500
0
  return 1;
501
0
}
502
503
int SharpYuvConvertWithOptions(const void* r_ptr, const void* g_ptr,
504
                               const void* b_ptr, int rgb_step, int rgb_stride,
505
                               int rgb_bit_depth, void* y_ptr, int y_stride,
506
                               void* u_ptr, int u_stride, void* v_ptr,
507
                               int v_stride, int yuv_bit_depth, int width,
508
0
                               int height, const SharpYuvOptions* options) {
509
0
  const SharpYuvConversionMatrix* yuv_matrix = options->yuv_matrix;
510
0
  SharpYuvTransferFunctionType transfer_type = options->transfer_type;
511
0
  SharpYuvConversionMatrix scaled_matrix;
512
0
  const int rgb_max = (1 << rgb_bit_depth) - 1;
513
0
  const int rgb_round = 1 << (rgb_bit_depth - 1);
514
0
  const int yuv_max = (1 << yuv_bit_depth) - 1;
515
0
  const int sfix = GetPrecisionShift(rgb_bit_depth);
516
517
0
  if (width < 1 || height < 1 || width == INT_MAX || height == INT_MAX ||
518
0
      r_ptr == NULL || g_ptr == NULL || b_ptr == NULL || y_ptr == NULL ||
519
0
      u_ptr == NULL || v_ptr == NULL) {
520
0
    return 0;
521
0
  }
522
0
  if (rgb_bit_depth != 8 && rgb_bit_depth != 10 && rgb_bit_depth != 12 &&
523
0
      rgb_bit_depth != 16) {
524
0
    return 0;
525
0
  }
526
0
  if (yuv_bit_depth != 8 && yuv_bit_depth != 10 && yuv_bit_depth != 12) {
527
0
    return 0;
528
0
  }
529
0
  if (rgb_bit_depth > 8 && (rgb_step % 2 != 0 || rgb_stride % 2 != 0)) {
530
    // Step/stride should be even for uint16_t buffers.
531
0
    return 0;
532
0
  }
533
0
  if (yuv_bit_depth > 8 &&
534
0
      (y_stride % 2 != 0 || u_stride % 2 != 0 || v_stride % 2 != 0)) {
535
    // Stride should be even for uint16_t buffers.
536
0
    return 0;
537
0
  }
538
  // The address of the function pointer is used to avoid a read race.
539
0
  SharpYuvInit((VP8CPUInfo)&SharpYuvGetCPUInfo);
540
541
  // Add scaling factor to go from rgb_bit_depth to yuv_bit_depth, to the
542
  // rgb->yuv conversion matrix.
543
0
  if (rgb_bit_depth == yuv_bit_depth) {
544
0
    memcpy(&scaled_matrix, yuv_matrix, sizeof(scaled_matrix));
545
0
  } else {
546
0
    int i;
547
0
    for (i = 0; i < 3; ++i) {
548
0
      scaled_matrix.rgb_to_y[i] =
549
0
          (yuv_matrix->rgb_to_y[i] * yuv_max + rgb_round) / rgb_max;
550
0
      scaled_matrix.rgb_to_u[i] =
551
0
          (yuv_matrix->rgb_to_u[i] * yuv_max + rgb_round) / rgb_max;
552
0
      scaled_matrix.rgb_to_v[i] =
553
0
          (yuv_matrix->rgb_to_v[i] * yuv_max + rgb_round) / rgb_max;
554
0
    }
555
0
  }
556
  // Also incorporate precision change scaling.
557
0
  scaled_matrix.rgb_to_y[3] = Shift(yuv_matrix->rgb_to_y[3], sfix);
558
0
  scaled_matrix.rgb_to_u[3] = Shift(yuv_matrix->rgb_to_u[3], sfix);
559
0
  scaled_matrix.rgb_to_v[3] = Shift(yuv_matrix->rgb_to_v[3], sfix);
560
561
0
  return DoSharpArgbToYuv(
562
0
      (const uint8_t*)r_ptr, (const uint8_t*)g_ptr, (const uint8_t*)b_ptr,
563
0
      rgb_step, rgb_stride, rgb_bit_depth, (uint8_t*)y_ptr, y_stride,
564
0
      (uint8_t*)u_ptr, u_stride, (uint8_t*)v_ptr, v_stride, yuv_bit_depth,
565
0
      width, height, &scaled_matrix, transfer_type);
566
0
}
567
568
//------------------------------------------------------------------------------