Coverage Report

Created: 2025-08-12 07:37

/src/libwebp/src/enc/iterator_enc.c
Line
Count
Source (jump to first uncovered line)
1
// Copyright 2011 Google Inc. All Rights Reserved.
2
//
3
// Use of this source code is governed by a BSD-style license
4
// that can be found in the COPYING file in the root of the source
5
// tree. An additional intellectual property rights grant can be found
6
// in the file PATENTS. All contributing project authors may
7
// be found in the AUTHORS file in the root of the source tree.
8
// -----------------------------------------------------------------------------
9
//
10
// VP8Iterator: block iterator
11
//
12
// Author: Skal (pascal.massimino@gmail.com)
13
14
#include <string.h>
15
16
#include "src/dsp/cpu.h"
17
#include "src/dsp/dsp.h"
18
#include "src/enc/vp8i_enc.h"
19
#include "src/utils/utils.h"
20
#include "src/webp/types.h"
21
22
//------------------------------------------------------------------------------
23
// VP8Iterator
24
//------------------------------------------------------------------------------
25
26
2.90k
static void InitLeft(VP8EncIterator* const it) {
27
2.90k
  it->y_left[-1] = it->u_left[-1] = it->v_left[-1] = (it->y > 0) ? 129 : 127;
28
2.90k
  memset(it->y_left, 129, 16);
29
2.90k
  memset(it->u_left, 129, 8);
30
2.90k
  memset(it->v_left, 129, 8);
31
2.90k
  it->left_nz[8] = 0;
32
2.90k
  if (it->top_derr != NULL) {
33
2.90k
    memset(&it->left_derr, 0, sizeof(it->left_derr));
34
2.90k
  }
35
2.90k
}
36
37
162
static void InitTop(VP8EncIterator* const it) {
38
162
  const VP8Encoder* const enc = it->enc;
39
162
  const size_t top_size = enc->mb_w * 16;
40
162
  memset(enc->y_top, 127, 2 * top_size);
41
162
  memset(enc->nz, 0, enc->mb_w * sizeof(*enc->nz));
42
162
  if (enc->top_derr != NULL) {
43
162
    memset(enc->top_derr, 0, enc->mb_w * sizeof(*enc->top_derr));
44
162
  }
45
162
}
46
47
2.23k
void VP8IteratorSetRow(VP8EncIterator* const it, int y) {
48
2.23k
  VP8Encoder* const enc = it->enc;
49
2.23k
  it->x = 0;
50
2.23k
  it->y = y;
51
2.23k
  it->bw = &enc->parts[y & (enc->num_parts - 1)];
52
2.23k
  it->preds = enc->preds + y * 4 * enc->preds_w;
53
2.23k
  it->nz = enc->nz;
54
2.23k
  it->mb = enc->mb_info + y * enc->mb_w;
55
2.23k
  it->y_top = enc->y_top;
56
2.23k
  it->uv_top = enc->uv_top;
57
2.23k
  InitLeft(it);
58
2.23k
}
59
60
// restart a scan
61
162
static void VP8IteratorReset(VP8EncIterator* const it) {
62
162
  VP8Encoder* const enc = it->enc;
63
162
  VP8IteratorSetRow(it, 0);
64
162
  VP8IteratorSetCountDown(it, enc->mb_w * enc->mb_h);  // default
65
162
  InitTop(it);
66
162
  memset(it->bit_count, 0, sizeof(it->bit_count));
67
162
  it->do_trellis = 0;
68
162
}
69
70
216
void VP8IteratorSetCountDown(VP8EncIterator* const it, int count_down) {
71
216
  it->count_down = it->count_down0 = count_down;
72
216
}
73
74
54
int VP8IteratorIsDone(const VP8EncIterator* const it) {
75
54
  return (it->count_down <= 0);
76
54
}
77
78
162
void VP8IteratorInit(VP8Encoder* const enc, VP8EncIterator* const it) {
79
162
  it->enc = enc;
80
162
  it->yuv_in = (uint8_t*)WEBP_ALIGN(it->yuv_mem);
81
162
  it->yuv_out = it->yuv_in + YUV_SIZE_ENC;
82
162
  it->yuv_out2 = it->yuv_out + YUV_SIZE_ENC;
83
162
  it->yuv_p = it->yuv_out2 + YUV_SIZE_ENC;
84
162
  it->lf_stats = enc->lf_stats;
85
162
  it->percent0 = enc->percent;
86
162
  it->y_left = (uint8_t*)WEBP_ALIGN(it->yuv_left_mem + 1);
87
162
  it->u_left = it->y_left + 16 + 16;
88
162
  it->v_left = it->u_left + 16;
89
162
  it->top_derr = enc->top_derr;
90
162
  VP8IteratorReset(it);
91
162
}
92
93
28.3k
int VP8IteratorProgress(const VP8EncIterator* const it, int delta) {
94
28.3k
  VP8Encoder* const enc = it->enc;
95
28.3k
  if (delta && enc->pic->progress_hook != NULL) {
96
0
    const int done = it->count_down0 - it->count_down;
97
0
    const int percent = (it->count_down0 <= 0)
98
0
                            ? it->percent0
99
0
                            : it->percent0 + delta * done / it->count_down0;
100
0
    return WebPReportProgress(enc->pic, percent, &enc->percent);
101
0
  }
102
28.3k
  return 1;
103
28.3k
}
104
105
//------------------------------------------------------------------------------
106
// Import the source samples into the cache. Takes care of replicating
107
// boundary pixels if necessary.
108
109
56.6k
static WEBP_INLINE int MinSize(int a, int b) { return (a < b) ? a : b; }
110
111
static void ImportBlock(const uint8_t* src, int src_stride, uint8_t* dst, int w,
112
84.9k
                        int h, int size) {
113
84.9k
  int i;
114
968k
  for (i = 0; i < h; ++i) {
115
883k
    memcpy(dst, src, w);
116
883k
    if (w < size) {
117
38.8k
      memset(dst + w, dst[w - 1], size - w);
118
38.8k
    }
119
883k
    dst += BPS;
120
883k
    src += src_stride;
121
883k
  }
122
106k
  for (i = h; i < size; ++i) {
123
21.9k
    memcpy(dst, dst - BPS, size);
124
21.9k
    dst += BPS;
125
21.9k
  }
126
84.9k
}
127
128
static void ImportLine(const uint8_t* src, int src_stride, uint8_t* dst,
129
80.0k
                       int len, int total_len) {
130
80.0k
  int i;
131
909k
  for (i = 0; i < len; ++i, src += src_stride) dst[i] = *src;
132
103k
  for (; i < total_len; ++i) dst[i] = dst[len - 1];
133
80.0k
}
134
135
28.3k
void VP8IteratorImport(VP8EncIterator* const it, uint8_t* const tmp_32) {
136
28.3k
  const VP8Encoder* const enc = it->enc;
137
28.3k
  const int x = it->x, y = it->y;
138
28.3k
  const WebPPicture* const pic = enc->pic;
139
28.3k
  const uint8_t* const ysrc = pic->y + (y * pic->y_stride + x) * 16;
140
28.3k
  const uint8_t* const usrc = pic->u + (y * pic->uv_stride + x) * 8;
141
28.3k
  const uint8_t* const vsrc = pic->v + (y * pic->uv_stride + x) * 8;
142
28.3k
  const int w = MinSize(pic->width - x * 16, 16);
143
28.3k
  const int h = MinSize(pic->height - y * 16, 16);
144
28.3k
  const int uv_w = (w + 1) >> 1;
145
28.3k
  const int uv_h = (h + 1) >> 1;
146
147
28.3k
  ImportBlock(ysrc, pic->y_stride, it->yuv_in + Y_OFF_ENC, w, h, 16);
148
28.3k
  ImportBlock(usrc, pic->uv_stride, it->yuv_in + U_OFF_ENC, uv_w, uv_h, 8);
149
28.3k
  ImportBlock(vsrc, pic->uv_stride, it->yuv_in + V_OFF_ENC, uv_w, uv_h, 8);
150
151
28.3k
  if (tmp_32 == NULL) return;
152
153
  // Import source (uncompressed) samples into boundary.
154
14.1k
  if (x == 0) {
155
672
    InitLeft(it);
156
13.4k
  } else {
157
13.4k
    if (y == 0) {
158
908
      it->y_left[-1] = it->u_left[-1] = it->v_left[-1] = 127;
159
12.5k
    } else {
160
12.5k
      it->y_left[-1] = ysrc[-1 - pic->y_stride];
161
12.5k
      it->u_left[-1] = usrc[-1 - pic->uv_stride];
162
12.5k
      it->v_left[-1] = vsrc[-1 - pic->uv_stride];
163
12.5k
    }
164
13.4k
    ImportLine(ysrc - 1, pic->y_stride, it->y_left, h, 16);
165
13.4k
    ImportLine(usrc - 1, pic->uv_stride, it->u_left, uv_h, 8);
166
13.4k
    ImportLine(vsrc - 1, pic->uv_stride, it->v_left, uv_h, 8);
167
13.4k
  }
168
169
14.1k
  it->y_top = tmp_32 + 0;
170
14.1k
  it->uv_top = tmp_32 + 16;
171
14.1k
  if (y == 0) {
172
962
    memset(tmp_32, 127, 32 * sizeof(*tmp_32));
173
13.1k
  } else {
174
13.1k
    ImportLine(ysrc - pic->y_stride, 1, tmp_32, w, 16);
175
13.1k
    ImportLine(usrc - pic->uv_stride, 1, tmp_32 + 16, uv_w, 8);
176
13.1k
    ImportLine(vsrc - pic->uv_stride, 1, tmp_32 + 16 + 8, uv_w, 8);
177
13.1k
  }
178
14.1k
}
179
180
//------------------------------------------------------------------------------
181
// Copy back the compressed samples into user space if requested.
182
183
static void ExportBlock(const uint8_t* src, uint8_t* dst, int dst_stride, int w,
184
0
                        int h) {
185
0
  while (h-- > 0) {
186
0
    memcpy(dst, src, w);
187
0
    dst += dst_stride;
188
0
    src += BPS;
189
0
  }
190
0
}
191
192
14.1k
void VP8IteratorExport(const VP8EncIterator* const it) {
193
14.1k
  const VP8Encoder* const enc = it->enc;
194
14.1k
  if (enc->config->show_compressed) {
195
0
    const int x = it->x, y = it->y;
196
0
    const uint8_t* const ysrc = it->yuv_out + Y_OFF_ENC;
197
0
    const uint8_t* const usrc = it->yuv_out + U_OFF_ENC;
198
0
    const uint8_t* const vsrc = it->yuv_out + V_OFF_ENC;
199
0
    const WebPPicture* const pic = enc->pic;
200
0
    uint8_t* const ydst = pic->y + (y * pic->y_stride + x) * 16;
201
0
    uint8_t* const udst = pic->u + (y * pic->uv_stride + x) * 8;
202
0
    uint8_t* const vdst = pic->v + (y * pic->uv_stride + x) * 8;
203
0
    int w = (pic->width - x * 16);
204
0
    int h = (pic->height - y * 16);
205
206
0
    if (w > 16) w = 16;
207
0
    if (h > 16) h = 16;
208
209
    // Luma plane
210
0
    ExportBlock(ysrc, ydst, pic->y_stride, w, h);
211
212
0
    {  // U/V planes
213
0
      const int uv_w = (w + 1) >> 1;
214
0
      const int uv_h = (h + 1) >> 1;
215
0
      ExportBlock(usrc, udst, pic->uv_stride, uv_w, uv_h);
216
0
      ExportBlock(vsrc, vdst, pic->uv_stride, uv_w, uv_h);
217
0
    }
218
0
  }
219
14.1k
}
220
221
//------------------------------------------------------------------------------
222
// Non-zero contexts setup/teardown
223
224
// Nz bits:
225
//  0  1  2  3  Y
226
//  4  5  6  7
227
//  8  9 10 11
228
// 12 13 14 15
229
// 16 17        U
230
// 18 19
231
// 20 21        V
232
// 22 23
233
// 24           DC-intra16
234
235
// Convert packed context to byte array
236
2.40M
#define BIT(nz, n) (!!((nz) & (1 << (n))))
237
238
141k
void VP8IteratorNzToBytes(VP8EncIterator* const it) {
239
141k
  const int tnz = it->nz[0], lnz = it->nz[-1];
240
141k
  int* const top_nz = it->top_nz;
241
141k
  int* const left_nz = it->left_nz;
242
243
  // Top-Y
244
141k
  top_nz[0] = BIT(tnz, 12);
245
141k
  top_nz[1] = BIT(tnz, 13);
246
141k
  top_nz[2] = BIT(tnz, 14);
247
141k
  top_nz[3] = BIT(tnz, 15);
248
  // Top-U
249
141k
  top_nz[4] = BIT(tnz, 18);
250
141k
  top_nz[5] = BIT(tnz, 19);
251
  // Top-V
252
141k
  top_nz[6] = BIT(tnz, 22);
253
141k
  top_nz[7] = BIT(tnz, 23);
254
  // DC
255
141k
  top_nz[8] = BIT(tnz, 24);
256
257
  // left-Y
258
141k
  left_nz[0] = BIT(lnz, 3);
259
141k
  left_nz[1] = BIT(lnz, 7);
260
141k
  left_nz[2] = BIT(lnz, 11);
261
141k
  left_nz[3] = BIT(lnz, 15);
262
  // left-U
263
141k
  left_nz[4] = BIT(lnz, 17);
264
141k
  left_nz[5] = BIT(lnz, 19);
265
  // left-V
266
141k
  left_nz[6] = BIT(lnz, 21);
267
141k
  left_nz[7] = BIT(lnz, 23);
268
  // left-DC is special, iterated separately
269
141k
}
270
271
14.1k
void VP8IteratorBytesToNz(VP8EncIterator* const it) {
272
14.1k
  uint32_t nz = 0;
273
14.1k
  const int* const top_nz = it->top_nz;
274
14.1k
  const int* const left_nz = it->left_nz;
275
  // top
276
14.1k
  nz |= (top_nz[0] << 12) | (top_nz[1] << 13);
277
14.1k
  nz |= (top_nz[2] << 14) | (top_nz[3] << 15);
278
14.1k
  nz |= (top_nz[4] << 18) | (top_nz[5] << 19);
279
14.1k
  nz |= (top_nz[6] << 22) | (top_nz[7] << 23);
280
14.1k
  nz |= (top_nz[8] << 24);  // we propagate the _top_ bit, esp. for intra4
281
  // left
282
14.1k
  nz |= (left_nz[0] << 3) | (left_nz[1] << 7);
283
14.1k
  nz |= (left_nz[2] << 11);
284
14.1k
  nz |= (left_nz[4] << 17) | (left_nz[6] << 21);
285
286
14.1k
  *it->nz = nz;
287
14.1k
}
288
289
#undef BIT
290
291
//------------------------------------------------------------------------------
292
// Advance to the next position, doing the bookkeeping.
293
294
14.1k
void VP8IteratorSaveBoundary(VP8EncIterator* const it) {
295
14.1k
  VP8Encoder* const enc = it->enc;
296
14.1k
  const int x = it->x, y = it->y;
297
14.1k
  const uint8_t* const ysrc = it->yuv_out + Y_OFF_ENC;
298
14.1k
  const uint8_t* const uvsrc = it->yuv_out + U_OFF_ENC;
299
14.1k
  if (x < enc->mb_w - 1) {  // left
300
13.4k
    int i;
301
229k
    for (i = 0; i < 16; ++i) {
302
215k
      it->y_left[i] = ysrc[15 + i * BPS];
303
215k
    }
304
121k
    for (i = 0; i < 8; ++i) {
305
107k
      it->u_left[i] = uvsrc[7 + i * BPS];
306
107k
      it->v_left[i] = uvsrc[15 + i * BPS];
307
107k
    }
308
    // top-left (before 'top'!)
309
13.4k
    it->y_left[-1] = it->y_top[15];
310
13.4k
    it->u_left[-1] = it->uv_top[0 + 7];
311
13.4k
    it->v_left[-1] = it->uv_top[8 + 7];
312
13.4k
  }
313
14.1k
  if (y < enc->mb_h - 1) {  // top
314
13.1k
    memcpy(it->y_top, ysrc + 15 * BPS, 16);
315
13.1k
    memcpy(it->uv_top, uvsrc + 7 * BPS, 8 + 8);
316
13.1k
  }
317
14.1k
}
318
319
42.4k
int VP8IteratorNext(VP8EncIterator* const it) {
320
42.4k
  if (++it->x == it->enc->mb_w) {
321
2.01k
    VP8IteratorSetRow(it, ++it->y);
322
40.4k
  } else {
323
40.4k
    it->preds += 4;
324
40.4k
    it->mb += 1;
325
40.4k
    it->nz += 1;
326
40.4k
    it->y_top += 16;
327
40.4k
    it->uv_top += 16;
328
40.4k
  }
329
42.4k
  return (0 < --it->count_down);
330
42.4k
}
331
332
//------------------------------------------------------------------------------
333
// Helper function to set mode properties
334
335
42.4k
void VP8SetIntra16Mode(const VP8EncIterator* const it, int mode) {
336
42.4k
  uint8_t* preds = it->preds;
337
42.4k
  int y;
338
212k
  for (y = 0; y < 4; ++y) {
339
169k
    memset(preds, mode, 4);
340
169k
    preds += it->enc->preds_w;
341
169k
  }
342
42.4k
  it->mb->type = 1;
343
42.4k
}
344
345
1.37k
void VP8SetIntra4Mode(const VP8EncIterator* const it, const uint8_t* modes) {
346
1.37k
  uint8_t* preds = it->preds;
347
1.37k
  int y;
348
6.88k
  for (y = 4; y > 0; --y) {
349
5.50k
    memcpy(preds, modes, 4 * sizeof(*modes));
350
5.50k
    preds += it->enc->preds_w;
351
5.50k
    modes += 4;
352
5.50k
  }
353
1.37k
  it->mb->type = 0;
354
1.37k
}
355
356
28.3k
void VP8SetIntraUVMode(const VP8EncIterator* const it, int mode) {
357
28.3k
  it->mb->uv_mode = mode;
358
28.3k
}
359
360
28.3k
void VP8SetSkip(const VP8EncIterator* const it, int skip) {
361
28.3k
  it->mb->skip = skip;
362
28.3k
}
363
364
14.1k
void VP8SetSegment(const VP8EncIterator* const it, int segment) {
365
14.1k
  it->mb->segment = segment;
366
14.1k
}
367
368
//------------------------------------------------------------------------------
369
// Intra4x4 sub-blocks iteration
370
//
371
//  We store and update the boundary samples into an array of 37 pixels. They
372
//  are updated as we iterate and reconstructs each intra4x4 blocks in turn.
373
//  The position of the samples has the following snake pattern:
374
//
375
// 16|17 18 19 20|21 22 23 24|25 26 27 28|29 30 31 32|33 34 35 36  <- Top-right
376
// --+-----------+-----------+-----------+-----------+
377
// 15|         19|         23|         27|         31|
378
// 14|         18|         22|         26|         30|
379
// 13|         17|         21|         25|         29|
380
// 12|13 14 15 16|17 18 19 20|21 22 23 24|25 26 27 28|
381
// --+-----------+-----------+-----------+-----------+
382
// 11|         15|         19|         23|         27|
383
// 10|         14|         18|         22|         26|
384
//  9|         13|         17|         21|         25|
385
//  8| 9 10 11 12|13 14 15 16|17 18 19 20|21 22 23 24|
386
// --+-----------+-----------+-----------+-----------+
387
//  7|         11|         15|         19|         23|
388
//  6|         10|         14|         18|         22|
389
//  5|          9|         13|         17|         21|
390
//  4| 5  6  7  8| 9 10 11 12|13 14 15 16|17 18 19 20|
391
// --+-----------+-----------+-----------+-----------+
392
//  3|          7|         11|         15|         19|
393
//  2|          6|         10|         14|         18|
394
//  1|          5|          9|         13|         17|
395
//  0| 1  2  3  4| 5  6  7  8| 9 10 11 12|13 14 15 16|
396
// --+-----------+-----------+-----------+-----------+
397
398
// Array to record the position of the top sample to pass to the prediction
399
// functions in dsp.c.
400
static const uint8_t VP8TopLeftI4[16] = {17, 21, 25, 29, 13, 17, 21, 25,
401
                                         9,  13, 17, 21, 5,  9,  13, 17};
402
403
14.1k
void VP8IteratorStartI4(VP8EncIterator* const it) {
404
14.1k
  const VP8Encoder* const enc = it->enc;
405
14.1k
  int i;
406
407
14.1k
  it->i4 = 0;  // first 4x4 sub-block
408
14.1k
  it->i4_top = it->i4_boundary + VP8TopLeftI4[0];
409
410
  // Import the boundary samples
411
254k
  for (i = 0; i < 17; ++i) {  // left
412
240k
    it->i4_boundary[i] = it->y_left[15 - i];
413
240k
  }
414
240k
  for (i = 0; i < 16; ++i) {  // top
415
226k
    it->i4_boundary[17 + i] = it->y_top[i];
416
226k
  }
417
  // top-right samples have a special case on the far right of the picture
418
14.1k
  if (it->x < enc->mb_w - 1) {
419
67.4k
    for (i = 16; i < 16 + 4; ++i) {
420
53.9k
      it->i4_boundary[17 + i] = it->y_top[i];
421
53.9k
    }
422
13.4k
  } else {  // else, replicate the last valid pixel four times
423
3.36k
    for (i = 16; i < 16 + 4; ++i) {
424
2.68k
      it->i4_boundary[17 + i] = it->i4_boundary[17 + 15];
425
2.68k
    }
426
672
  }
427
#if WEBP_AARCH64 && BPS == 32 && defined(WEBP_MSAN)
428
  // Intra4Preds_NEON() reads 3 uninitialized bytes from 'i4_boundary' when top
429
  // is positioned at offset 29 (VP8TopLeftI4[3]). The values are not used
430
  // meaningfully, but due to limitations in MemorySanitizer related to
431
  // modeling of tbl instructions, a warning will be issued. This can be
432
  // removed if MSan is updated to support the instructions. See
433
  // https://issues.webmproject.org/372109644.
434
  memset(it->i4_boundary + sizeof(it->i4_boundary) - 3, 0xaa, 3);
435
#endif
436
14.1k
  VP8IteratorNzToBytes(it);  // import the non-zero context
437
14.1k
}
438
439
int VP8IteratorRotateI4(VP8EncIterator* const it,
440
70.6k
                        const uint8_t* const yuv_out) {
441
70.6k
  const uint8_t* const blk = yuv_out + VP8Scan[it->i4];
442
70.6k
  uint8_t* const top = it->i4_top;
443
70.6k
  int i;
444
445
  // Update the cache with 7 fresh samples
446
353k
  for (i = 0; i <= 3; ++i) {
447
282k
    top[-4 + i] = blk[i + 3 * BPS];  // store future top samples
448
282k
  }
449
70.6k
  if ((it->i4 & 3) != 3) {  // if not on the right sub-blocks #3, #7, #11, #15
450
240k
    for (i = 0; i <= 2; ++i) {  // store future left samples
451
180k
      top[i] = blk[3 + (2 - i) * BPS];
452
180k
    }
453
60.1k
  } else {  // else replicate top-right samples, as says the specs.
454
52.7k
    for (i = 0; i <= 3; ++i) {
455
42.2k
      top[i] = top[i + 4];
456
42.2k
    }
457
10.5k
  }
458
  // move pointers to next sub-block
459
70.6k
  ++it->i4;
460
70.6k
  if (it->i4 == 16) {  // we're done
461
1.37k
    return 0;
462
1.37k
  }
463
464
69.3k
  it->i4_top = it->i4_boundary + VP8TopLeftI4[it->i4];
465
69.3k
  return 1;
466
70.6k
}
467
468
//------------------------------------------------------------------------------