Coverage Report

Created: 2023-06-07 06:03

/src/libjpeg-turbo.main/jdsample.c
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * jdsample.c
3
 *
4
 * This file was part of the Independent JPEG Group's software:
5
 * Copyright (C) 1991-1996, Thomas G. Lane.
6
 * libjpeg-turbo Modifications:
7
 * Copyright 2009 Pierre Ossman <ossman@cendio.se> for Cendio AB
8
 * Copyright (C) 2010, 2015-2016, 2022, D. R. Commander.
9
 * Copyright (C) 2014, MIPS Technologies, Inc., California.
10
 * Copyright (C) 2015, Google, Inc.
11
 * Copyright (C) 2019-2020, Arm Limited.
12
 * For conditions of distribution and use, see the accompanying README.ijg
13
 * file.
14
 *
15
 * This file contains upsampling routines.
16
 *
17
 * Upsampling input data is counted in "row groups".  A row group
18
 * is defined to be (v_samp_factor * DCT_scaled_size / min_DCT_scaled_size)
19
 * sample rows of each component.  Upsampling will normally produce
20
 * max_v_samp_factor pixel rows from each row group (but this could vary
21
 * if the upsampler is applying a scale factor of its own).
22
 *
23
 * An excellent reference for image resampling is
24
 *   Digital Image Warping, George Wolberg, 1990.
25
 *   Pub. by IEEE Computer Society Press, Los Alamitos, CA. ISBN 0-8186-8944-7.
26
 */
27
28
#include "jinclude.h"
29
#include "jdsample.h"
30
#include "jsimd.h"
31
#include "jpegapicomp.h"
32
33
34
35
#if BITS_IN_JSAMPLE != 16 || defined(D_LOSSLESS_SUPPORTED)
36
37
/*
38
 * Initialize for an upsampling pass.
39
 */
40
41
METHODDEF(void)
42
start_pass_upsample(j_decompress_ptr cinfo)
43
15.9k
{
44
15.9k
  my_upsample_ptr upsample = (my_upsample_ptr)cinfo->upsample;
45
46
  /* Mark the conversion buffer empty */
47
15.9k
  upsample->next_row_out = cinfo->max_v_samp_factor;
48
  /* Initialize total-height counter for detecting bottom of image */
49
15.9k
  upsample->rows_to_go = cinfo->output_height;
50
15.9k
}
51
52
53
/*
54
 * Control routine to do upsampling (and color conversion).
55
 *
56
 * In this version we upsample each component independently.
57
 * We upsample one row group into the conversion buffer, then apply
58
 * color conversion a row at a time.
59
 */
60
61
METHODDEF(void)
62
sep_upsample(j_decompress_ptr cinfo, _JSAMPIMAGE input_buf,
63
             JDIMENSION *in_row_group_ctr, JDIMENSION in_row_groups_avail,
64
             _JSAMPARRAY output_buf, JDIMENSION *out_row_ctr,
65
             JDIMENSION out_rows_avail)
66
38.0M
{
67
38.0M
  my_upsample_ptr upsample = (my_upsample_ptr)cinfo->upsample;
68
38.0M
  int ci;
69
38.0M
  jpeg_component_info *compptr;
70
38.0M
  JDIMENSION num_rows;
71
72
  /* Fill the conversion buffer, if it's empty */
73
38.0M
  if (upsample->next_row_out >= cinfo->max_v_samp_factor) {
74
97.1M
    for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
75
59.1M
         ci++, compptr++) {
76
      /* Invoke per-component upsample method.  Notice we pass a POINTER
77
       * to color_buf[ci], so that fullsize_upsample can change it.
78
       */
79
59.1M
      (*upsample->methods[ci]) (cinfo, compptr,
80
59.1M
        input_buf[ci] + (*in_row_group_ctr * upsample->rowgroup_height[ci]),
81
59.1M
        upsample->color_buf + ci);
82
59.1M
    }
83
38.0M
    upsample->next_row_out = 0;
84
38.0M
  }
85
86
  /* Color-convert and emit rows */
87
88
  /* How many we have in the buffer: */
89
38.0M
  num_rows = (JDIMENSION)(cinfo->max_v_samp_factor - upsample->next_row_out);
90
  /* Not more than the distance to the end of the image.  Need this test
91
   * in case the image height is not a multiple of max_v_samp_factor:
92
   */
93
38.0M
  if (num_rows > upsample->rows_to_go)
94
5.88k
    num_rows = upsample->rows_to_go;
95
  /* And not more than what the client can accept: */
96
38.0M
  out_rows_avail -= *out_row_ctr;
97
38.0M
  if (num_rows > out_rows_avail)
98
0
    num_rows = out_rows_avail;
99
100
38.0M
  (*cinfo->cconvert->_color_convert) (cinfo, upsample->color_buf,
101
38.0M
                                      (JDIMENSION)upsample->next_row_out,
102
38.0M
                                      output_buf + *out_row_ctr,
103
38.0M
                                      (int)num_rows);
104
105
  /* Adjust counts */
106
38.0M
  *out_row_ctr += num_rows;
107
38.0M
  upsample->rows_to_go -= num_rows;
108
38.0M
  upsample->next_row_out += num_rows;
109
  /* When the buffer is emptied, declare this input row group consumed */
110
38.0M
  if (upsample->next_row_out >= cinfo->max_v_samp_factor)
111
38.0M
    (*in_row_group_ctr)++;
112
38.0M
}
113
114
115
/*
116
 * These are the routines invoked by sep_upsample to upsample pixel values
117
 * of a single component.  One row group is processed per call.
118
 */
119
120
121
/*
122
 * For full-size components, we just make color_buf[ci] point at the
123
 * input buffer, and thus avoid copying any data.  Note that this is
124
 * safe only because sep_upsample doesn't declare the input row group
125
 * "consumed" until we are done color converting and emitting it.
126
 */
127
128
METHODDEF(void)
129
fullsize_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
130
                  _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
131
36.7M
{
132
36.7M
  *output_data_ptr = input_data;
133
36.7M
}
134
135
136
/*
137
 * This is a no-op version used for "uninteresting" components.
138
 * These components will not be referenced by color conversion.
139
 */
140
141
METHODDEF(void)
142
noop_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
143
              _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
144
5.14M
{
145
5.14M
  *output_data_ptr = NULL;      /* safety check */
146
5.14M
}
147
148
149
/*
150
 * This version handles any integral sampling ratios.
151
 * This is not used for typical JPEG files, so it need not be fast.
152
 * Nor, for that matter, is it particularly accurate: the algorithm is
153
 * simple replication of the input pixel onto the corresponding output
154
 * pixels.  The hi-falutin sampling literature refers to this as a
155
 * "box filter".  A box filter tends to introduce visible artifacts,
156
 * so if you are actually going to use 3:1 or 4:1 sampling ratios
157
 * you would be well advised to improve this code.
158
 */
159
160
METHODDEF(void)
161
int_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
162
             _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
163
10.2M
{
164
10.2M
  my_upsample_ptr upsample = (my_upsample_ptr)cinfo->upsample;
165
10.2M
  _JSAMPARRAY output_data = *output_data_ptr;
166
10.2M
  register _JSAMPROW inptr, outptr;
167
10.2M
  register _JSAMPLE invalue;
168
10.2M
  register int h;
169
10.2M
  _JSAMPROW outend;
170
10.2M
  int h_expand, v_expand;
171
10.2M
  int inrow, outrow;
172
173
10.2M
  h_expand = upsample->h_expand[compptr->component_index];
174
10.2M
  v_expand = upsample->v_expand[compptr->component_index];
175
176
10.2M
  inrow = outrow = 0;
177
22.5M
  while (outrow < cinfo->max_v_samp_factor) {
178
    /* Generate one output row with proper horizontal expansion */
179
12.2M
    inptr = input_data[inrow];
180
12.2M
    outptr = output_data[outrow];
181
12.2M
    outend = outptr + cinfo->output_width;
182
278M
    while (outptr < outend) {
183
266M
      invalue = *inptr++;
184
749M
      for (h = h_expand; h > 0; h--) {
185
483M
        *outptr++ = invalue;
186
483M
      }
187
266M
    }
188
    /* Generate any additional output rows by duplicating the first one */
189
12.2M
    if (v_expand > 1) {
190
6.82M
      _jcopy_sample_rows(output_data, outrow, output_data, outrow + 1,
191
6.82M
                         v_expand - 1, cinfo->output_width);
192
6.82M
    }
193
12.2M
    inrow++;
194
12.2M
    outrow += v_expand;
195
12.2M
  }
196
10.2M
}
197
198
199
/*
200
 * Fast processing for the common case of 2:1 horizontal and 1:1 vertical.
201
 * It's still a box filter.
202
 */
203
204
METHODDEF(void)
205
h2v1_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
206
              _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
207
847k
{
208
847k
  _JSAMPARRAY output_data = *output_data_ptr;
209
847k
  register _JSAMPROW inptr, outptr;
210
847k
  register _JSAMPLE invalue;
211
847k
  _JSAMPROW outend;
212
847k
  int inrow;
213
214
2.36M
  for (inrow = 0; inrow < cinfo->max_v_samp_factor; inrow++) {
215
1.51M
    inptr = input_data[inrow];
216
1.51M
    outptr = output_data[inrow];
217
1.51M
    outend = outptr + cinfo->output_width;
218
22.0M
    while (outptr < outend) {
219
20.5M
      invalue = *inptr++;
220
20.5M
      *outptr++ = invalue;
221
20.5M
      *outptr++ = invalue;
222
20.5M
    }
223
1.51M
  }
224
847k
}
225
226
227
/*
228
 * Fast processing for the common case of 2:1 horizontal and 2:1 vertical.
229
 * It's still a box filter.
230
 */
231
232
METHODDEF(void)
233
h2v2_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
234
              _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
235
253k
{
236
253k
  _JSAMPARRAY output_data = *output_data_ptr;
237
253k
  register _JSAMPROW inptr, outptr;
238
253k
  register _JSAMPLE invalue;
239
253k
  _JSAMPROW outend;
240
253k
  int inrow, outrow;
241
242
253k
  inrow = outrow = 0;
243
597k
  while (outrow < cinfo->max_v_samp_factor) {
244
343k
    inptr = input_data[inrow];
245
343k
    outptr = output_data[outrow];
246
343k
    outend = outptr + cinfo->output_width;
247
9.50M
    while (outptr < outend) {
248
9.16M
      invalue = *inptr++;
249
9.16M
      *outptr++ = invalue;
250
9.16M
      *outptr++ = invalue;
251
9.16M
    }
252
343k
    _jcopy_sample_rows(output_data, outrow, output_data, outrow + 1, 1,
253
343k
                       cinfo->output_width);
254
343k
    inrow++;
255
343k
    outrow += 2;
256
343k
  }
257
253k
}
258
259
260
/*
261
 * Fancy processing for the common case of 2:1 horizontal and 1:1 vertical.
262
 *
263
 * The upsampling algorithm is linear interpolation between pixel centers,
264
 * also known as a "triangle filter".  This is a good compromise between
265
 * speed and visual quality.  The centers of the output pixels are 1/4 and 3/4
266
 * of the way between input pixel centers.
267
 *
268
 * A note about the "bias" calculations: when rounding fractional values to
269
 * integer, we do not want to always round 0.5 up to the next integer.
270
 * If we did that, we'd introduce a noticeable bias towards larger values.
271
 * Instead, this code is arranged so that 0.5 will be rounded up or down at
272
 * alternate pixel locations (a simple ordered dither pattern).
273
 */
274
275
METHODDEF(void)
276
h2v1_fancy_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
277
                    _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
278
141k
{
279
141k
  _JSAMPARRAY output_data = *output_data_ptr;
280
141k
  register _JSAMPROW inptr, outptr;
281
141k
  register int invalue;
282
141k
  register JDIMENSION colctr;
283
141k
  int inrow;
284
285
506k
  for (inrow = 0; inrow < cinfo->max_v_samp_factor; inrow++) {
286
365k
    inptr = input_data[inrow];
287
365k
    outptr = output_data[inrow];
288
    /* Special case for first column */
289
365k
    invalue = *inptr++;
290
365k
    *outptr++ = (_JSAMPLE)invalue;
291
365k
    *outptr++ = (_JSAMPLE)((invalue * 3 + inptr[0] + 2) >> 2);
292
293
8.67M
    for (colctr = compptr->downsampled_width - 2; colctr > 0; colctr--) {
294
      /* General case: 3/4 * nearer pixel + 1/4 * further pixel */
295
8.31M
      invalue = (*inptr++) * 3;
296
8.31M
      *outptr++ = (_JSAMPLE)((invalue + inptr[-2] + 1) >> 2);
297
8.31M
      *outptr++ = (_JSAMPLE)((invalue + inptr[0] + 2) >> 2);
298
8.31M
    }
299
300
    /* Special case for last column */
301
365k
    invalue = *inptr;
302
365k
    *outptr++ = (_JSAMPLE)((invalue * 3 + inptr[-1] + 1) >> 2);
303
365k
    *outptr++ = (_JSAMPLE)invalue;
304
365k
  }
305
141k
}
306
307
308
/*
309
 * Fancy processing for 1:1 horizontal and 2:1 vertical (4:4:0 subsampling).
310
 *
311
 * This is a less common case, but it can be encountered when losslessly
312
 * rotating/transposing a JPEG file that uses 4:2:2 chroma subsampling.
313
 */
314
315
METHODDEF(void)
316
h1v2_fancy_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
317
                    _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
318
876k
{
319
876k
  _JSAMPARRAY output_data = *output_data_ptr;
320
876k
  _JSAMPROW inptr0, inptr1, outptr;
321
#if BITS_IN_JSAMPLE == 8
322
  int thiscolsum, bias;
323
#else
324
876k
  JLONG thiscolsum, bias;
325
876k
#endif
326
876k
  JDIMENSION colctr;
327
876k
  int inrow, outrow, v;
328
329
876k
  inrow = outrow = 0;
330
2.04M
  while (outrow < cinfo->max_v_samp_factor) {
331
3.51M
    for (v = 0; v < 2; v++) {
332
      /* inptr0 points to nearest input row, inptr1 points to next nearest */
333
2.34M
      inptr0 = input_data[inrow];
334
2.34M
      if (v == 0) {             /* next nearest is row above */
335
1.17M
        inptr1 = input_data[inrow - 1];
336
1.17M
        bias = 1;
337
1.17M
      } else {                  /* next nearest is row below */
338
1.17M
        inptr1 = input_data[inrow + 1];
339
1.17M
        bias = 2;
340
1.17M
      }
341
2.34M
      outptr = output_data[outrow++];
342
343
55.5M
      for (colctr = 0; colctr < compptr->downsampled_width; colctr++) {
344
53.1M
        thiscolsum = (*inptr0++) * 3 + (*inptr1++);
345
53.1M
        *outptr++ = (_JSAMPLE)((thiscolsum + bias) >> 2);
346
53.1M
      }
347
2.34M
    }
348
1.17M
    inrow++;
349
1.17M
  }
350
876k
}
351
352
353
/*
354
 * Fancy processing for the common case of 2:1 horizontal and 2:1 vertical.
355
 * Again a triangle filter; see comments for h2v1 case, above.
356
 *
357
 * It is OK for us to reference the adjacent input rows because we demanded
358
 * context from the main buffer controller (see initialization code).
359
 */
360
361
METHODDEF(void)
362
h2v2_fancy_upsample(j_decompress_ptr cinfo, jpeg_component_info *compptr,
363
                    _JSAMPARRAY input_data, _JSAMPARRAY *output_data_ptr)
364
41.3k
{
365
41.3k
  _JSAMPARRAY output_data = *output_data_ptr;
366
41.3k
  register _JSAMPROW inptr0, inptr1, outptr;
367
#if BITS_IN_JSAMPLE == 8
368
  register int thiscolsum, lastcolsum, nextcolsum;
369
#else
370
41.3k
  register JLONG thiscolsum, lastcolsum, nextcolsum;
371
41.3k
#endif
372
41.3k
  register JDIMENSION colctr;
373
41.3k
  int inrow, outrow, v;
374
375
41.3k
  inrow = outrow = 0;
376
93.9k
  while (outrow < cinfo->max_v_samp_factor) {
377
157k
    for (v = 0; v < 2; v++) {
378
      /* inptr0 points to nearest input row, inptr1 points to next nearest */
379
105k
      inptr0 = input_data[inrow];
380
105k
      if (v == 0)               /* next nearest is row above */
381
52.5k
        inptr1 = input_data[inrow - 1];
382
52.5k
      else                      /* next nearest is row below */
383
52.5k
        inptr1 = input_data[inrow + 1];
384
105k
      outptr = output_data[outrow++];
385
386
      /* Special case for first column */
387
105k
      thiscolsum = (*inptr0++) * 3 + (*inptr1++);
388
105k
      nextcolsum = (*inptr0++) * 3 + (*inptr1++);
389
105k
      *outptr++ = (_JSAMPLE)((thiscolsum * 4 + 8) >> 4);
390
105k
      *outptr++ = (_JSAMPLE)((thiscolsum * 3 + nextcolsum + 7) >> 4);
391
105k
      lastcolsum = thiscolsum;  thiscolsum = nextcolsum;
392
393
5.26M
      for (colctr = compptr->downsampled_width - 2; colctr > 0; colctr--) {
394
        /* General case: 3/4 * nearer pixel + 1/4 * further pixel in each */
395
        /* dimension, thus 9/16, 3/16, 3/16, 1/16 overall */
396
5.15M
        nextcolsum = (*inptr0++) * 3 + (*inptr1++);
397
5.15M
        *outptr++ = (_JSAMPLE)((thiscolsum * 3 + lastcolsum + 8) >> 4);
398
5.15M
        *outptr++ = (_JSAMPLE)((thiscolsum * 3 + nextcolsum + 7) >> 4);
399
5.15M
        lastcolsum = thiscolsum;  thiscolsum = nextcolsum;
400
5.15M
      }
401
402
      /* Special case for last column */
403
105k
      *outptr++ = (_JSAMPLE)((thiscolsum * 3 + lastcolsum + 8) >> 4);
404
105k
      *outptr++ = (_JSAMPLE)((thiscolsum * 4 + 7) >> 4);
405
105k
    }
406
52.5k
    inrow++;
407
52.5k
  }
408
41.3k
}
409
410
411
/*
412
 * Module initialization routine for upsampling.
413
 */
414
415
GLOBAL(void)
416
_jinit_upsampler(j_decompress_ptr cinfo)
417
8.20k
{
418
8.20k
  my_upsample_ptr upsample;
419
8.20k
  int ci;
420
8.20k
  jpeg_component_info *compptr;
421
8.20k
  boolean need_buffer, do_fancy;
422
8.20k
  int h_in_group, v_in_group, h_out_group, v_out_group;
423
424
8.20k
  if (cinfo->data_precision != BITS_IN_JSAMPLE)
425
0
    ERREXIT1(cinfo, JERR_BAD_PRECISION, cinfo->data_precision);
426
427
8.20k
  if (!cinfo->master->jinit_upsampler_no_alloc) {
428
8.20k
    upsample = (my_upsample_ptr)
429
8.20k
      (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
430
8.20k
                                  sizeof(my_upsampler));
431
8.20k
    cinfo->upsample = (struct jpeg_upsampler *)upsample;
432
8.20k
    upsample->pub.start_pass = start_pass_upsample;
433
8.20k
    upsample->pub._upsample = sep_upsample;
434
8.20k
    upsample->pub.need_context_rows = FALSE; /* until we find out differently */
435
8.20k
  } else
436
0
    upsample = (my_upsample_ptr)cinfo->upsample;
437
438
8.20k
  if (cinfo->CCIR601_sampling)  /* this isn't supported */
439
0
    ERREXIT(cinfo, JERR_CCIR601_NOTIMPL);
440
441
  /* jdmainct.c doesn't support context rows when min_DCT_scaled_size = 1,
442
   * so don't ask for it.
443
   */
444
8.20k
  do_fancy = cinfo->do_fancy_upsampling && cinfo->_min_DCT_scaled_size > 1;
445
446
  /* Verify we can handle the sampling factors, select per-component methods,
447
   * and create storage as needed.
448
   */
449
26.1k
  for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
450
17.9k
       ci++, compptr++) {
451
    /* Compute size of an "input group" after IDCT scaling.  This many samples
452
     * are to be converted to max_h_samp_factor * max_v_samp_factor pixels.
453
     */
454
17.9k
    h_in_group = (compptr->h_samp_factor * compptr->_DCT_scaled_size) /
455
17.9k
                 cinfo->_min_DCT_scaled_size;
456
17.9k
    v_in_group = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
457
17.9k
                 cinfo->_min_DCT_scaled_size;
458
17.9k
    h_out_group = cinfo->max_h_samp_factor;
459
17.9k
    v_out_group = cinfo->max_v_samp_factor;
460
17.9k
    upsample->rowgroup_height[ci] = v_in_group; /* save for use later */
461
17.9k
    need_buffer = TRUE;
462
17.9k
    if (!compptr->component_needed) {
463
      /* Don't bother to upsample an uninteresting component. */
464
1.24k
      upsample->methods[ci] = noop_upsample;
465
1.24k
      need_buffer = FALSE;
466
16.7k
    } else if (h_in_group == h_out_group && v_in_group == v_out_group) {
467
      /* Fullsize components can be processed without any work. */
468
8.12k
      upsample->methods[ci] = fullsize_upsample;
469
8.12k
      need_buffer = FALSE;
470
8.58k
    } else if (h_in_group * 2 == h_out_group && v_in_group == v_out_group) {
471
      /* Special cases for 2h1v upsampling */
472
2.16k
      if (do_fancy && compptr->downsampled_width > 2) {
473
#ifdef WITH_SIMD
474
70
        if (jsimd_can_h2v1_fancy_upsample())
475
70
          upsample->methods[ci] = jsimd_h2v1_fancy_upsample;
476
0
        else
477
0
#endif
478
0
          upsample->methods[ci] = h2v1_fancy_upsample;
479
1.93k
      } else {
480
#ifdef WITH_SIMD
481
599
        if (jsimd_can_h2v1_upsample())
482
599
          upsample->methods[ci] = jsimd_h2v1_upsample;
483
0
        else
484
0
#endif
485
0
          upsample->methods[ci] = h2v1_upsample;
486
1.93k
      }
487
6.41k
    } else if (h_in_group == h_out_group &&
488
6.41k
               v_in_group * 2 == v_out_group && do_fancy) {
489
      /* Non-fancy upsampling is handled by the generic method */
490
#if defined(WITH_SIMD) && (defined(__arm__) || defined(__aarch64__) || \
491
                           defined(_M_ARM) || defined(_M_ARM64))
492
      if (jsimd_can_h1v2_fancy_upsample())
493
        upsample->methods[ci] = jsimd_h1v2_fancy_upsample;
494
      else
495
#endif
496
316
        upsample->methods[ci] = h1v2_fancy_upsample;
497
316
      upsample->pub.need_context_rows = TRUE;
498
6.09k
    } else if (h_in_group * 2 == h_out_group &&
499
6.09k
               v_in_group * 2 == v_out_group) {
500
      /* Special cases for 2h2v upsampling */
501
2.80k
      if (do_fancy && compptr->downsampled_width > 2) {
502
#ifdef WITH_SIMD
503
25
        if (jsimd_can_h2v2_fancy_upsample())
504
25
          upsample->methods[ci] = jsimd_h2v2_fancy_upsample;
505
0
        else
506
0
#endif
507
0
          upsample->methods[ci] = h2v2_fancy_upsample;
508
68
        upsample->pub.need_context_rows = TRUE;
509
2.73k
      } else {
510
#ifdef WITH_SIMD
511
994
        if (jsimd_can_h2v2_upsample())
512
994
          upsample->methods[ci] = jsimd_h2v2_upsample;
513
0
        else
514
0
#endif
515
0
          upsample->methods[ci] = h2v2_upsample;
516
2.73k
      }
517
3.29k
    } else if ((h_out_group % h_in_group) == 0 &&
518
3.29k
               (v_out_group % v_in_group) == 0) {
519
      /* Generic integral-factors upsampling method */
520
#if defined(WITH_SIMD) && defined(__mips__)
521
      if (jsimd_can_int_upsample())
522
        upsample->methods[ci] = jsimd_int_upsample;
523
      else
524
#endif
525
3.26k
        upsample->methods[ci] = int_upsample;
526
3.26k
      upsample->h_expand[ci] = (UINT8)(h_out_group / h_in_group);
527
3.26k
      upsample->v_expand[ci] = (UINT8)(v_out_group / v_in_group);
528
3.26k
    } else
529
22
      ERREXIT(cinfo, JERR_FRACT_SAMPLE_NOTIMPL);
530
17.9k
    if (need_buffer && !cinfo->master->jinit_upsampler_no_alloc) {
531
8.55k
      upsample->color_buf[ci] = (_JSAMPARRAY)(*cinfo->mem->alloc_sarray)
532
8.55k
        ((j_common_ptr)cinfo, JPOOL_IMAGE,
533
8.55k
         (JDIMENSION)jround_up((long)cinfo->output_width,
534
8.55k
                               (long)cinfo->max_h_samp_factor),
535
8.55k
         (JDIMENSION)cinfo->max_v_samp_factor);
536
8.55k
    }
537
17.9k
  }
538
8.20k
}
j12init_upsampler
Line
Count
Source
417
3.59k
{
418
3.59k
  my_upsample_ptr upsample;
419
3.59k
  int ci;
420
3.59k
  jpeg_component_info *compptr;
421
3.59k
  boolean need_buffer, do_fancy;
422
3.59k
  int h_in_group, v_in_group, h_out_group, v_out_group;
423
424
3.59k
  if (cinfo->data_precision != BITS_IN_JSAMPLE)
425
0
    ERREXIT1(cinfo, JERR_BAD_PRECISION, cinfo->data_precision);
426
427
3.59k
  if (!cinfo->master->jinit_upsampler_no_alloc) {
428
3.59k
    upsample = (my_upsample_ptr)
429
3.59k
      (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
430
3.59k
                                  sizeof(my_upsampler));
431
3.59k
    cinfo->upsample = (struct jpeg_upsampler *)upsample;
432
3.59k
    upsample->pub.start_pass = start_pass_upsample;
433
3.59k
    upsample->pub._upsample = sep_upsample;
434
3.59k
    upsample->pub.need_context_rows = FALSE; /* until we find out differently */
435
3.59k
  } else
436
0
    upsample = (my_upsample_ptr)cinfo->upsample;
437
438
3.59k
  if (cinfo->CCIR601_sampling)  /* this isn't supported */
439
0
    ERREXIT(cinfo, JERR_CCIR601_NOTIMPL);
440
441
  /* jdmainct.c doesn't support context rows when min_DCT_scaled_size = 1,
442
   * so don't ask for it.
443
   */
444
3.59k
  do_fancy = cinfo->do_fancy_upsampling && cinfo->_min_DCT_scaled_size > 1;
445
446
  /* Verify we can handle the sampling factors, select per-component methods,
447
   * and create storage as needed.
448
   */
449
11.7k
  for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
450
8.13k
       ci++, compptr++) {
451
    /* Compute size of an "input group" after IDCT scaling.  This many samples
452
     * are to be converted to max_h_samp_factor * max_v_samp_factor pixels.
453
     */
454
8.13k
    h_in_group = (compptr->h_samp_factor * compptr->_DCT_scaled_size) /
455
8.13k
                 cinfo->_min_DCT_scaled_size;
456
8.13k
    v_in_group = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
457
8.13k
                 cinfo->_min_DCT_scaled_size;
458
8.13k
    h_out_group = cinfo->max_h_samp_factor;
459
8.13k
    v_out_group = cinfo->max_v_samp_factor;
460
8.13k
    upsample->rowgroup_height[ci] = v_in_group; /* save for use later */
461
8.13k
    need_buffer = TRUE;
462
8.13k
    if (!compptr->component_needed) {
463
      /* Don't bother to upsample an uninteresting component. */
464
844
      upsample->methods[ci] = noop_upsample;
465
844
      need_buffer = FALSE;
466
7.28k
    } else if (h_in_group == h_out_group && v_in_group == v_out_group) {
467
      /* Fullsize components can be processed without any work. */
468
3.84k
      upsample->methods[ci] = fullsize_upsample;
469
3.84k
      need_buffer = FALSE;
470
3.84k
    } else if (h_in_group * 2 == h_out_group && v_in_group == v_out_group) {
471
      /* Special cases for 2h1v upsampling */
472
799
      if (do_fancy && compptr->downsampled_width > 2) {
473
#ifdef WITH_SIMD
474
        if (jsimd_can_h2v1_fancy_upsample())
475
          upsample->methods[ci] = jsimd_h2v1_fancy_upsample;
476
        else
477
#endif
478
167
          upsample->methods[ci] = h2v1_fancy_upsample;
479
632
      } else {
480
#ifdef WITH_SIMD
481
        if (jsimd_can_h2v1_upsample())
482
          upsample->methods[ci] = jsimd_h2v1_upsample;
483
        else
484
#endif
485
632
          upsample->methods[ci] = h2v1_upsample;
486
632
      }
487
2.64k
    } else if (h_in_group == h_out_group &&
488
2.64k
               v_in_group * 2 == v_out_group && do_fancy) {
489
      /* Non-fancy upsampling is handled by the generic method */
490
#if defined(WITH_SIMD) && (defined(__arm__) || defined(__aarch64__) || \
491
                           defined(_M_ARM) || defined(_M_ARM64))
492
      if (jsimd_can_h1v2_fancy_upsample())
493
        upsample->methods[ci] = jsimd_h1v2_fancy_upsample;
494
      else
495
#endif
496
205
        upsample->methods[ci] = h1v2_fancy_upsample;
497
205
      upsample->pub.need_context_rows = TRUE;
498
2.44k
    } else if (h_in_group * 2 == h_out_group &&
499
2.44k
               v_in_group * 2 == v_out_group) {
500
      /* Special cases for 2h2v upsampling */
501
1.05k
      if (do_fancy && compptr->downsampled_width > 2) {
502
#ifdef WITH_SIMD
503
        if (jsimd_can_h2v2_fancy_upsample())
504
          upsample->methods[ci] = jsimd_h2v2_fancy_upsample;
505
        else
506
#endif
507
43
          upsample->methods[ci] = h2v2_fancy_upsample;
508
43
        upsample->pub.need_context_rows = TRUE;
509
1.01k
      } else {
510
#ifdef WITH_SIMD
511
        if (jsimd_can_h2v2_upsample())
512
          upsample->methods[ci] = jsimd_h2v2_upsample;
513
        else
514
#endif
515
1.01k
          upsample->methods[ci] = h2v2_upsample;
516
1.01k
      }
517
1.38k
    } else if ((h_out_group % h_in_group) == 0 &&
518
1.38k
               (v_out_group % v_in_group) == 0) {
519
      /* Generic integral-factors upsampling method */
520
#if defined(WITH_SIMD) && defined(__mips__)
521
      if (jsimd_can_int_upsample())
522
        upsample->methods[ci] = jsimd_int_upsample;
523
      else
524
#endif
525
1.38k
        upsample->methods[ci] = int_upsample;
526
1.38k
      upsample->h_expand[ci] = (UINT8)(h_out_group / h_in_group);
527
1.38k
      upsample->v_expand[ci] = (UINT8)(v_out_group / v_in_group);
528
1.38k
    } else
529
9
      ERREXIT(cinfo, JERR_FRACT_SAMPLE_NOTIMPL);
530
8.13k
    if (need_buffer && !cinfo->master->jinit_upsampler_no_alloc) {
531
3.43k
      upsample->color_buf[ci] = (_JSAMPARRAY)(*cinfo->mem->alloc_sarray)
532
3.43k
        ((j_common_ptr)cinfo, JPOOL_IMAGE,
533
3.43k
         (JDIMENSION)jround_up((long)cinfo->output_width,
534
3.43k
                               (long)cinfo->max_h_samp_factor),
535
3.43k
         (JDIMENSION)cinfo->max_v_samp_factor);
536
3.43k
    }
537
8.13k
  }
538
3.59k
}
jinit_upsampler
Line
Count
Source
417
3.70k
{
418
3.70k
  my_upsample_ptr upsample;
419
3.70k
  int ci;
420
3.70k
  jpeg_component_info *compptr;
421
3.70k
  boolean need_buffer, do_fancy;
422
3.70k
  int h_in_group, v_in_group, h_out_group, v_out_group;
423
424
3.70k
  if (cinfo->data_precision != BITS_IN_JSAMPLE)
425
0
    ERREXIT1(cinfo, JERR_BAD_PRECISION, cinfo->data_precision);
426
427
3.70k
  if (!cinfo->master->jinit_upsampler_no_alloc) {
428
3.70k
    upsample = (my_upsample_ptr)
429
3.70k
      (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
430
3.70k
                                  sizeof(my_upsampler));
431
3.70k
    cinfo->upsample = (struct jpeg_upsampler *)upsample;
432
3.70k
    upsample->pub.start_pass = start_pass_upsample;
433
3.70k
    upsample->pub._upsample = sep_upsample;
434
3.70k
    upsample->pub.need_context_rows = FALSE; /* until we find out differently */
435
3.70k
  } else
436
0
    upsample = (my_upsample_ptr)cinfo->upsample;
437
438
3.70k
  if (cinfo->CCIR601_sampling)  /* this isn't supported */
439
0
    ERREXIT(cinfo, JERR_CCIR601_NOTIMPL);
440
441
  /* jdmainct.c doesn't support context rows when min_DCT_scaled_size = 1,
442
   * so don't ask for it.
443
   */
444
3.70k
  do_fancy = cinfo->do_fancy_upsampling && cinfo->_min_DCT_scaled_size > 1;
445
446
  /* Verify we can handle the sampling factors, select per-component methods,
447
   * and create storage as needed.
448
   */
449
10.8k
  for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
450
7.11k
       ci++, compptr++) {
451
    /* Compute size of an "input group" after IDCT scaling.  This many samples
452
     * are to be converted to max_h_samp_factor * max_v_samp_factor pixels.
453
     */
454
7.11k
    h_in_group = (compptr->h_samp_factor * compptr->_DCT_scaled_size) /
455
7.11k
                 cinfo->_min_DCT_scaled_size;
456
7.11k
    v_in_group = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
457
7.11k
                 cinfo->_min_DCT_scaled_size;
458
7.11k
    h_out_group = cinfo->max_h_samp_factor;
459
7.11k
    v_out_group = cinfo->max_v_samp_factor;
460
7.11k
    upsample->rowgroup_height[ci] = v_in_group; /* save for use later */
461
7.11k
    need_buffer = TRUE;
462
7.11k
    if (!compptr->component_needed) {
463
      /* Don't bother to upsample an uninteresting component. */
464
404
      upsample->methods[ci] = noop_upsample;
465
404
      need_buffer = FALSE;
466
6.71k
    } else if (h_in_group == h_out_group && v_in_group == v_out_group) {
467
      /* Fullsize components can be processed without any work. */
468
3.65k
      upsample->methods[ci] = fullsize_upsample;
469
3.65k
      need_buffer = FALSE;
470
3.65k
    } else if (h_in_group * 2 == h_out_group && v_in_group == v_out_group) {
471
      /* Special cases for 2h1v upsampling */
472
669
      if (do_fancy && compptr->downsampled_width > 2) {
473
70
#ifdef WITH_SIMD
474
70
        if (jsimd_can_h2v1_fancy_upsample())
475
70
          upsample->methods[ci] = jsimd_h2v1_fancy_upsample;
476
0
        else
477
0
#endif
478
0
          upsample->methods[ci] = h2v1_fancy_upsample;
479
599
      } else {
480
599
#ifdef WITH_SIMD
481
599
        if (jsimd_can_h2v1_upsample())
482
599
          upsample->methods[ci] = jsimd_h2v1_upsample;
483
0
        else
484
0
#endif
485
0
          upsample->methods[ci] = h2v1_upsample;
486
599
      }
487
2.39k
    } else if (h_in_group == h_out_group &&
488
2.39k
               v_in_group * 2 == v_out_group && do_fancy) {
489
      /* Non-fancy upsampling is handled by the generic method */
490
#if defined(WITH_SIMD) && (defined(__arm__) || defined(__aarch64__) || \
491
                           defined(_M_ARM) || defined(_M_ARM64))
492
      if (jsimd_can_h1v2_fancy_upsample())
493
        upsample->methods[ci] = jsimd_h1v2_fancy_upsample;
494
      else
495
#endif
496
111
        upsample->methods[ci] = h1v2_fancy_upsample;
497
111
      upsample->pub.need_context_rows = TRUE;
498
2.28k
    } else if (h_in_group * 2 == h_out_group &&
499
2.28k
               v_in_group * 2 == v_out_group) {
500
      /* Special cases for 2h2v upsampling */
501
1.01k
      if (do_fancy && compptr->downsampled_width > 2) {
502
25
#ifdef WITH_SIMD
503
25
        if (jsimd_can_h2v2_fancy_upsample())
504
25
          upsample->methods[ci] = jsimd_h2v2_fancy_upsample;
505
0
        else
506
0
#endif
507
0
          upsample->methods[ci] = h2v2_fancy_upsample;
508
25
        upsample->pub.need_context_rows = TRUE;
509
994
      } else {
510
994
#ifdef WITH_SIMD
511
994
        if (jsimd_can_h2v2_upsample())
512
994
          upsample->methods[ci] = jsimd_h2v2_upsample;
513
0
        else
514
0
#endif
515
0
          upsample->methods[ci] = h2v2_upsample;
516
994
      }
517
1.26k
    } else if ((h_out_group % h_in_group) == 0 &&
518
1.26k
               (v_out_group % v_in_group) == 0) {
519
      /* Generic integral-factors upsampling method */
520
#if defined(WITH_SIMD) && defined(__mips__)
521
      if (jsimd_can_int_upsample())
522
        upsample->methods[ci] = jsimd_int_upsample;
523
      else
524
#endif
525
1.25k
        upsample->methods[ci] = int_upsample;
526
1.25k
      upsample->h_expand[ci] = (UINT8)(h_out_group / h_in_group);
527
1.25k
      upsample->v_expand[ci] = (UINT8)(v_out_group / v_in_group);
528
1.25k
    } else
529
6
      ERREXIT(cinfo, JERR_FRACT_SAMPLE_NOTIMPL);
530
7.11k
    if (need_buffer && !cinfo->master->jinit_upsampler_no_alloc) {
531
3.05k
      upsample->color_buf[ci] = (_JSAMPARRAY)(*cinfo->mem->alloc_sarray)
532
3.05k
        ((j_common_ptr)cinfo, JPOOL_IMAGE,
533
3.05k
         (JDIMENSION)jround_up((long)cinfo->output_width,
534
3.05k
                               (long)cinfo->max_h_samp_factor),
535
3.05k
         (JDIMENSION)cinfo->max_v_samp_factor);
536
3.05k
    }
537
7.11k
  }
538
3.70k
}
j16init_upsampler
Line
Count
Source
417
911
{
418
911
  my_upsample_ptr upsample;
419
911
  int ci;
420
911
  jpeg_component_info *compptr;
421
911
  boolean need_buffer, do_fancy;
422
911
  int h_in_group, v_in_group, h_out_group, v_out_group;
423
424
911
  if (cinfo->data_precision != BITS_IN_JSAMPLE)
425
0
    ERREXIT1(cinfo, JERR_BAD_PRECISION, cinfo->data_precision);
426
427
911
  if (!cinfo->master->jinit_upsampler_no_alloc) {
428
911
    upsample = (my_upsample_ptr)
429
911
      (*cinfo->mem->alloc_small) ((j_common_ptr)cinfo, JPOOL_IMAGE,
430
911
                                  sizeof(my_upsampler));
431
911
    cinfo->upsample = (struct jpeg_upsampler *)upsample;
432
911
    upsample->pub.start_pass = start_pass_upsample;
433
911
    upsample->pub._upsample = sep_upsample;
434
911
    upsample->pub.need_context_rows = FALSE; /* until we find out differently */
435
911
  } else
436
0
    upsample = (my_upsample_ptr)cinfo->upsample;
437
438
911
  if (cinfo->CCIR601_sampling)  /* this isn't supported */
439
0
    ERREXIT(cinfo, JERR_CCIR601_NOTIMPL);
440
441
  /* jdmainct.c doesn't support context rows when min_DCT_scaled_size = 1,
442
   * so don't ask for it.
443
   */
444
911
  do_fancy = cinfo->do_fancy_upsampling && cinfo->_min_DCT_scaled_size > 1;
445
446
  /* Verify we can handle the sampling factors, select per-component methods,
447
   * and create storage as needed.
448
   */
449
3.61k
  for (ci = 0, compptr = cinfo->comp_info; ci < cinfo->num_components;
450
2.70k
       ci++, compptr++) {
451
    /* Compute size of an "input group" after IDCT scaling.  This many samples
452
     * are to be converted to max_h_samp_factor * max_v_samp_factor pixels.
453
     */
454
2.70k
    h_in_group = (compptr->h_samp_factor * compptr->_DCT_scaled_size) /
455
2.70k
                 cinfo->_min_DCT_scaled_size;
456
2.70k
    v_in_group = (compptr->v_samp_factor * compptr->_DCT_scaled_size) /
457
2.70k
                 cinfo->_min_DCT_scaled_size;
458
2.70k
    h_out_group = cinfo->max_h_samp_factor;
459
2.70k
    v_out_group = cinfo->max_v_samp_factor;
460
2.70k
    upsample->rowgroup_height[ci] = v_in_group; /* save for use later */
461
2.70k
    need_buffer = TRUE;
462
2.70k
    if (!compptr->component_needed) {
463
      /* Don't bother to upsample an uninteresting component. */
464
0
      upsample->methods[ci] = noop_upsample;
465
0
      need_buffer = FALSE;
466
2.70k
    } else if (h_in_group == h_out_group && v_in_group == v_out_group) {
467
      /* Fullsize components can be processed without any work. */
468
633
      upsample->methods[ci] = fullsize_upsample;
469
633
      need_buffer = FALSE;
470
2.07k
    } else if (h_in_group * 2 == h_out_group && v_in_group == v_out_group) {
471
      /* Special cases for 2h1v upsampling */
472
699
      if (do_fancy && compptr->downsampled_width > 2) {
473
#ifdef WITH_SIMD
474
        if (jsimd_can_h2v1_fancy_upsample())
475
          upsample->methods[ci] = jsimd_h2v1_fancy_upsample;
476
        else
477
#endif
478
0
          upsample->methods[ci] = h2v1_fancy_upsample;
479
699
      } else {
480
#ifdef WITH_SIMD
481
        if (jsimd_can_h2v1_upsample())
482
          upsample->methods[ci] = jsimd_h2v1_upsample;
483
        else
484
#endif
485
699
          upsample->methods[ci] = h2v1_upsample;
486
699
      }
487
1.37k
    } else if (h_in_group == h_out_group &&
488
1.37k
               v_in_group * 2 == v_out_group && do_fancy) {
489
      /* Non-fancy upsampling is handled by the generic method */
490
#if defined(WITH_SIMD) && (defined(__arm__) || defined(__aarch64__) || \
491
                           defined(_M_ARM) || defined(_M_ARM64))
492
      if (jsimd_can_h1v2_fancy_upsample())
493
        upsample->methods[ci] = jsimd_h1v2_fancy_upsample;
494
      else
495
#endif
496
0
        upsample->methods[ci] = h1v2_fancy_upsample;
497
0
      upsample->pub.need_context_rows = TRUE;
498
1.37k
    } else if (h_in_group * 2 == h_out_group &&
499
1.37k
               v_in_group * 2 == v_out_group) {
500
      /* Special cases for 2h2v upsampling */
501
734
      if (do_fancy && compptr->downsampled_width > 2) {
502
#ifdef WITH_SIMD
503
        if (jsimd_can_h2v2_fancy_upsample())
504
          upsample->methods[ci] = jsimd_h2v2_fancy_upsample;
505
        else
506
#endif
507
0
          upsample->methods[ci] = h2v2_fancy_upsample;
508
0
        upsample->pub.need_context_rows = TRUE;
509
734
      } else {
510
#ifdef WITH_SIMD
511
        if (jsimd_can_h2v2_upsample())
512
          upsample->methods[ci] = jsimd_h2v2_upsample;
513
        else
514
#endif
515
734
          upsample->methods[ci] = h2v2_upsample;
516
734
      }
517
734
    } else if ((h_out_group % h_in_group) == 0 &&
518
641
               (v_out_group % v_in_group) == 0) {
519
      /* Generic integral-factors upsampling method */
520
#if defined(WITH_SIMD) && defined(__mips__)
521
      if (jsimd_can_int_upsample())
522
        upsample->methods[ci] = jsimd_int_upsample;
523
      else
524
#endif
525
634
        upsample->methods[ci] = int_upsample;
526
634
      upsample->h_expand[ci] = (UINT8)(h_out_group / h_in_group);
527
634
      upsample->v_expand[ci] = (UINT8)(v_out_group / v_in_group);
528
634
    } else
529
7
      ERREXIT(cinfo, JERR_FRACT_SAMPLE_NOTIMPL);
530
2.70k
    if (need_buffer && !cinfo->master->jinit_upsampler_no_alloc) {
531
2.06k
      upsample->color_buf[ci] = (_JSAMPARRAY)(*cinfo->mem->alloc_sarray)
532
2.06k
        ((j_common_ptr)cinfo, JPOOL_IMAGE,
533
2.06k
         (JDIMENSION)jround_up((long)cinfo->output_width,
534
2.06k
                               (long)cinfo->max_h_samp_factor),
535
2.06k
         (JDIMENSION)cinfo->max_v_samp_factor);
536
2.06k
    }
537
2.70k
  }
538
911
}
539
540
#endif /* BITS_IN_JSAMPLE != 16 || defined(D_LOSSLESS_SUPPORTED) */