Coverage Report

Created: 2023-06-07 06:31

/src/aom/av1/common/cfl.h
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#ifndef AOM_AV1_COMMON_CFL_H_
13
#define AOM_AV1_COMMON_CFL_H_
14
15
#include "av1/common/av1_common_int.h"
16
#include "av1/common/blockd.h"
17
18
// Can we use CfL for the current block?
19
11.9M
static INLINE CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
11.9M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
11.9M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
11.9M
  assert(bsize < BLOCK_SIZES_ALL);
23
11.9M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
158k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
158k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
158k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
158k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
158k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
11.7M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
11.7M
                            block_size_high[bsize] <= 32);
34
11.9M
}
Unexecuted instantiation: decodeframe.c:is_cfl_allowed
decodemv.c:is_cfl_allowed
Line
Count
Source
19
9.33M
static INLINE CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
9.33M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
9.33M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
9.33M
  assert(bsize < BLOCK_SIZES_ALL);
23
9.33M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
156k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
156k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
156k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
156k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
156k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
9.17M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
9.17M
                            block_size_high[bsize] <= 32);
34
9.33M
}
cfl.c:is_cfl_allowed
Line
Count
Source
19
2.60M
static INLINE CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
2.60M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
2.60M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
2.60M
  assert(bsize < BLOCK_SIZES_ALL);
23
2.60M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
2.61k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
2.61k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
2.61k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
2.61k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
2.61k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
2.60M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
2.60M
                            block_size_high[bsize] <= 32);
34
2.60M
}
Unexecuted instantiation: reconintra.c:is_cfl_allowed
Unexecuted instantiation: cfl_sse2.c:is_cfl_allowed
Unexecuted instantiation: cfl_ssse3.c:is_cfl_allowed
Unexecuted instantiation: cfl_avx2.c:is_cfl_allowed
35
36
// Do we need to save the luma pixels from the current block,
37
// for a possible future CfL prediction?
38
static INLINE CFL_ALLOWED_TYPE store_cfl_required(const AV1_COMMON *cm,
39
59.9M
                                                  const MACROBLOCKD *xd) {
40
59.9M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
59.9M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
58.6M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
3.55M
    return CFL_ALLOWED;
51
3.55M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
55.1M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
55.1M
                            mbmi->uv_mode == UV_CFL_PRED);
57
58.6M
}
decodeframe.c:store_cfl_required
Line
Count
Source
39
43.4M
                                                  const MACROBLOCKD *xd) {
40
43.4M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
43.4M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
42.3M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
1.73M
    return CFL_ALLOWED;
51
1.73M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
40.6M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
40.6M
                            mbmi->uv_mode == UV_CFL_PRED);
57
42.3M
}
decodemv.c:store_cfl_required
Line
Count
Source
39
16.5M
                                                  const MACROBLOCKD *xd) {
40
16.5M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
16.5M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
16.3M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
1.81M
    return CFL_ALLOWED;
51
1.81M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
14.5M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
14.5M
                            mbmi->uv_mode == UV_CFL_PRED);
57
16.3M
}
Unexecuted instantiation: cfl.c:store_cfl_required
Unexecuted instantiation: reconintra.c:store_cfl_required
Unexecuted instantiation: cfl_sse2.c:store_cfl_required
Unexecuted instantiation: cfl_ssse3.c:store_cfl_required
Unexecuted instantiation: cfl_avx2.c:store_cfl_required
58
59
0
static INLINE int get_scaled_luma_q0(int alpha_q3, int16_t pred_buf_q3) {
60
0
  int scaled_luma_q6 = alpha_q3 * pred_buf_q3;
61
0
  return ROUND_POWER_OF_TWO_SIGNED(scaled_luma_q6, 6);
62
0
}
Unexecuted instantiation: decodeframe.c:get_scaled_luma_q0
Unexecuted instantiation: decodemv.c:get_scaled_luma_q0
Unexecuted instantiation: cfl.c:get_scaled_luma_q0
Unexecuted instantiation: reconintra.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_sse2.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_ssse3.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_avx2.c:get_scaled_luma_q0
63
64
2.60M
static INLINE CFL_PRED_TYPE get_cfl_pred_type(int plane) {
65
2.60M
  assert(plane > 0);
66
0
  return (CFL_PRED_TYPE)(plane - 1);
67
2.60M
}
Unexecuted instantiation: decodeframe.c:get_cfl_pred_type
Unexecuted instantiation: decodemv.c:get_cfl_pred_type
Unexecuted instantiation: cfl.c:get_cfl_pred_type
reconintra.c:get_cfl_pred_type
Line
Count
Source
64
2.60M
static INLINE CFL_PRED_TYPE get_cfl_pred_type(int plane) {
65
2.60M
  assert(plane > 0);
66
0
  return (CFL_PRED_TYPE)(plane - 1);
67
2.60M
}
Unexecuted instantiation: cfl_sse2.c:get_cfl_pred_type
Unexecuted instantiation: cfl_ssse3.c:get_cfl_pred_type
Unexecuted instantiation: cfl_avx2.c:get_cfl_pred_type
68
69
264k
static INLINE void clear_cfl_dc_pred_cache_flags(CFL_CTX *cfl) {
70
264k
  cfl->use_dc_pred_cache = false;
71
264k
  cfl->dc_pred_is_cached[CFL_PRED_U] = false;
72
264k
  cfl->dc_pred_is_cached[CFL_PRED_V] = false;
73
264k
}
Unexecuted instantiation: decodeframe.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: decodemv.c:clear_cfl_dc_pred_cache_flags
cfl.c:clear_cfl_dc_pred_cache_flags
Line
Count
Source
69
264k
static INLINE void clear_cfl_dc_pred_cache_flags(CFL_CTX *cfl) {
70
264k
  cfl->use_dc_pred_cache = false;
71
264k
  cfl->dc_pred_is_cached[CFL_PRED_U] = false;
72
264k
  cfl->dc_pred_is_cached[CFL_PRED_V] = false;
73
264k
}
Unexecuted instantiation: reconintra.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_sse2.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_ssse3.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_avx2.c:clear_cfl_dc_pred_cache_flags
74
75
void cfl_predict_block(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
76
                       TX_SIZE tx_size, int plane);
77
78
void cfl_store_block(MACROBLOCKD *const xd, BLOCK_SIZE bsize, TX_SIZE tx_size);
79
80
void cfl_store_tx(MACROBLOCKD *const xd, int row, int col, TX_SIZE tx_size,
81
                  BLOCK_SIZE bsize);
82
83
void cfl_store_dc_pred(MACROBLOCKD *const xd, const uint8_t *input,
84
                       CFL_PRED_TYPE pred_plane, int width);
85
86
void cfl_load_dc_pred(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
87
                      TX_SIZE tx_size, CFL_PRED_TYPE pred_plane);
88
89
// Allows the CFL_SUBSAMPLE function to switch types depending on the bitdepth.
90
#define CFL_lbd_TYPE uint8_t *cfl_type
91
#define CFL_hbd_TYPE uint16_t *cfl_type
92
93
// Declare a size-specific wrapper for the size-generic function. The compiler
94
// will inline the size generic function in here, the advantage is that the size
95
// will be constant allowing for loop unrolling and other constant propagated
96
// goodness.
97
#define CFL_SUBSAMPLE(arch, sub, bd, width, height)                       \
98
  void cfl_subsample_##bd##_##sub##_##width##x##height##_##arch(          \
99
3.31M
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
3.31M
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
3.31M
                                               output_q3, width, height); \
102
3.31M
  }
Unexecuted instantiation: cfl_subsample_lbd_420_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x8_c
cfl_subsample_lbd_420_4x4_ssse3
Line
Count
Source
99
499k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
499k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
499k
                                               output_q3, width, height); \
102
499k
  }
cfl_subsample_lbd_420_8x8_ssse3
Line
Count
Source
99
134k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
134k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
134k
                                               output_q3, width, height); \
102
134k
  }
cfl_subsample_lbd_420_16x16_ssse3
Line
Count
Source
99
51.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
51.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
51.0k
                                               output_q3, width, height); \
102
51.0k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x32_ssse3
cfl_subsample_lbd_420_4x8_ssse3
Line
Count
Source
99
210k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
210k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
210k
                                               output_q3, width, height); \
102
210k
  }
cfl_subsample_lbd_420_8x4_ssse3
Line
Count
Source
99
252k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
252k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
252k
                                               output_q3, width, height); \
102
252k
  }
cfl_subsample_lbd_420_8x16_ssse3
Line
Count
Source
99
28.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
28.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
28.4k
                                               output_q3, width, height); \
102
28.4k
  }
cfl_subsample_lbd_420_16x8_ssse3
Line
Count
Source
99
46.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
46.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
46.7k
                                               output_q3, width, height); \
102
46.7k
  }
cfl_subsample_lbd_420_16x32_ssse3
Line
Count
Source
99
8.98k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
8.98k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
8.98k
                                               output_q3, width, height); \
102
8.98k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x16_ssse3
cfl_subsample_lbd_420_4x16_ssse3
Line
Count
Source
99
216k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
216k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
216k
                                               output_q3, width, height); \
102
216k
  }
cfl_subsample_lbd_420_16x4_ssse3
Line
Count
Source
99
272k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
272k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
272k
                                               output_q3, width, height); \
102
272k
  }
cfl_subsample_lbd_420_8x32_ssse3
Line
Count
Source
99
14.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
14.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
14.7k
                                               output_q3, width, height); \
102
14.7k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x8_ssse3
cfl_subsample_lbd_422_4x4_ssse3
Line
Count
Source
99
1.00k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
1.00k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
1.00k
                                               output_q3, width, height); \
102
1.00k
  }
cfl_subsample_lbd_422_8x8_ssse3
Line
Count
Source
99
364
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
364
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
364
                                               output_q3, width, height); \
102
364
  }
cfl_subsample_lbd_422_16x16_ssse3
Line
Count
Source
99
289
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
289
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
289
                                               output_q3, width, height); \
102
289
  }
Unexecuted instantiation: cfl_subsample_lbd_422_32x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_4x8_ssse3
cfl_subsample_lbd_422_8x4_ssse3
Line
Count
Source
99
152
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
152
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
152
                                               output_q3, width, height); \
102
152
  }
Unexecuted instantiation: cfl_subsample_lbd_422_8x16_ssse3
cfl_subsample_lbd_422_16x8_ssse3
Line
Count
Source
99
1.23k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
1.23k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
1.23k
                                               output_q3, width, height); \
102
1.23k
  }
Unexecuted instantiation: cfl_subsample_lbd_422_16x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_32x16_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_4x16_ssse3
cfl_subsample_lbd_422_16x4_ssse3
Line
Count
Source
99
868
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
868
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
868
                                               output_q3, width, height); \
102
868
  }
Unexecuted instantiation: cfl_subsample_lbd_422_8x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_32x8_ssse3
cfl_subsample_lbd_444_4x4_ssse3
Line
Count
Source
99
41.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
41.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
41.2k
                                               output_q3, width, height); \
102
41.2k
  }
cfl_subsample_lbd_444_8x8_ssse3
Line
Count
Source
99
46.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
46.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
46.2k
                                               output_q3, width, height); \
102
46.2k
  }
cfl_subsample_lbd_444_16x16_ssse3
Line
Count
Source
99
28.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
28.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
28.6k
                                               output_q3, width, height); \
102
28.6k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x32_ssse3
cfl_subsample_lbd_444_4x8_ssse3
Line
Count
Source
99
10.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
10.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
10.1k
                                               output_q3, width, height); \
102
10.1k
  }
cfl_subsample_lbd_444_8x4_ssse3
Line
Count
Source
99
14.9k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
14.9k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
14.9k
                                               output_q3, width, height); \
102
14.9k
  }
cfl_subsample_lbd_444_8x16_ssse3
Line
Count
Source
99
15.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
15.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
15.0k
                                               output_q3, width, height); \
102
15.0k
  }
cfl_subsample_lbd_444_16x8_ssse3
Line
Count
Source
99
23.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
23.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
23.0k
                                               output_q3, width, height); \
102
23.0k
  }
cfl_subsample_lbd_444_16x32_ssse3
Line
Count
Source
99
7.79k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
7.79k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
7.79k
                                               output_q3, width, height); \
102
7.79k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x16_ssse3
cfl_subsample_lbd_444_4x16_ssse3
Line
Count
Source
99
40.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
40.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
40.6k
                                               output_q3, width, height); \
102
40.6k
  }
cfl_subsample_lbd_444_16x4_ssse3
Line
Count
Source
99
38.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
38.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
38.2k
                                               output_q3, width, height); \
102
38.2k
  }
cfl_subsample_lbd_444_8x32_ssse3
Line
Count
Source
99
15.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
15.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
15.4k
                                               output_q3, width, height); \
102
15.4k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x8_ssse3
cfl_subsample_hbd_420_4x4_ssse3
Line
Count
Source
99
113k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
113k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
113k
                                               output_q3, width, height); \
102
113k
  }
cfl_subsample_hbd_420_8x8_ssse3
Line
Count
Source
99
31.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
31.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
31.1k
                                               output_q3, width, height); \
102
31.1k
  }
cfl_subsample_hbd_420_16x16_ssse3
Line
Count
Source
99
18.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
18.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
18.0k
                                               output_q3, width, height); \
102
18.0k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x32_ssse3
cfl_subsample_hbd_420_4x8_ssse3
Line
Count
Source
99
73.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
73.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
73.2k
                                               output_q3, width, height); \
102
73.2k
  }
cfl_subsample_hbd_420_8x4_ssse3
Line
Count
Source
99
84.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
84.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
84.6k
                                               output_q3, width, height); \
102
84.6k
  }
cfl_subsample_hbd_420_8x16_ssse3
Line
Count
Source
99
7.61k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
7.61k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
7.61k
                                               output_q3, width, height); \
102
7.61k
  }
cfl_subsample_hbd_420_16x8_ssse3
Line
Count
Source
99
17.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
17.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
17.7k
                                               output_q3, width, height); \
102
17.7k
  }
cfl_subsample_hbd_420_16x32_ssse3
Line
Count
Source
99
2.84k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
2.84k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
2.84k
                                               output_q3, width, height); \
102
2.84k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x16_ssse3
cfl_subsample_hbd_420_4x16_ssse3
Line
Count
Source
99
65.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
65.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
65.8k
                                               output_q3, width, height); \
102
65.8k
  }
cfl_subsample_hbd_420_16x4_ssse3
Line
Count
Source
99
86.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
86.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
86.1k
                                               output_q3, width, height); \
102
86.1k
  }
cfl_subsample_hbd_420_8x32_ssse3
Line
Count
Source
99
5.06k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
5.06k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
5.06k
                                               output_q3, width, height); \
102
5.06k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x8_ssse3
cfl_subsample_hbd_422_4x4_ssse3
Line
Count
Source
99
1.63k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
1.63k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
1.63k
                                               output_q3, width, height); \
102
1.63k
  }
cfl_subsample_hbd_422_8x8_ssse3
Line
Count
Source
99
285
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
285
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
285
                                               output_q3, width, height); \
102
285
  }
cfl_subsample_hbd_422_16x16_ssse3
Line
Count
Source
99
34
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
34
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
34
                                               output_q3, width, height); \
102
34
  }
Unexecuted instantiation: cfl_subsample_hbd_422_32x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_4x8_ssse3
cfl_subsample_hbd_422_8x4_ssse3
Line
Count
Source
99
56
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
56
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
56
                                               output_q3, width, height); \
102
56
  }
Unexecuted instantiation: cfl_subsample_hbd_422_8x16_ssse3
cfl_subsample_hbd_422_16x8_ssse3
Line
Count
Source
99
174
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
174
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
174
                                               output_q3, width, height); \
102
174
  }
Unexecuted instantiation: cfl_subsample_hbd_422_16x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_32x16_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_4x16_ssse3
cfl_subsample_hbd_422_16x4_ssse3
Line
Count
Source
99
16
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
16
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
16
                                               output_q3, width, height); \
102
16
  }
Unexecuted instantiation: cfl_subsample_hbd_422_8x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_32x8_ssse3
cfl_subsample_hbd_444_4x4_ssse3
Line
Count
Source
99
124k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
124k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
124k
                                               output_q3, width, height); \
102
124k
  }
cfl_subsample_hbd_444_8x8_ssse3
Line
Count
Source
99
179k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
179k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
179k
                                               output_q3, width, height); \
102
179k
  }
cfl_subsample_hbd_444_16x16_ssse3
Line
Count
Source
99
42.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
42.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
42.6k
                                               output_q3, width, height); \
102
42.6k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x32_ssse3
cfl_subsample_hbd_444_4x8_ssse3
Line
Count
Source
99
35.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
35.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
35.7k
                                               output_q3, width, height); \
102
35.7k
  }
cfl_subsample_hbd_444_8x4_ssse3
Line
Count
Source
99
62.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
62.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
62.5k
                                               output_q3, width, height); \
102
62.5k
  }
cfl_subsample_hbd_444_8x16_ssse3
Line
Count
Source
99
43.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
43.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
43.4k
                                               output_q3, width, height); \
102
43.4k
  }
cfl_subsample_hbd_444_16x8_ssse3
Line
Count
Source
99
48.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
48.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
48.3k
                                               output_q3, width, height); \
102
48.3k
  }
cfl_subsample_hbd_444_16x32_ssse3
Line
Count
Source
99
6.67k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
6.67k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
6.67k
                                               output_q3, width, height); \
102
6.67k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x16_ssse3
cfl_subsample_hbd_444_4x16_ssse3
Line
Count
Source
99
31.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
31.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
31.4k
                                               output_q3, width, height); \
102
31.4k
  }
cfl_subsample_hbd_444_16x4_ssse3
Line
Count
Source
99
37.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
37.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
37.3k
                                               output_q3, width, height); \
102
37.3k
  }
cfl_subsample_hbd_444_8x32_ssse3
Line
Count
Source
99
15.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
15.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
15.5k
                                               output_q3, width, height); \
102
15.5k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x8_ssse3
cfl_subsample_lbd_420_32x32_avx2
Line
Count
Source
99
28.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
28.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
28.7k
                                               output_q3, width, height); \
102
28.7k
  }
cfl_subsample_lbd_420_32x16_avx2
Line
Count
Source
99
8.76k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
8.76k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
8.76k
                                               output_q3, width, height); \
102
8.76k
  }
cfl_subsample_lbd_420_32x8_avx2
Line
Count
Source
99
12.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
12.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
12.6k
                                               output_q3, width, height); \
102
12.6k
  }
cfl_subsample_lbd_422_32x32_avx2
Line
Count
Source
99
888
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
888
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
888
                                               output_q3, width, height); \
102
888
  }
cfl_subsample_lbd_422_32x16_avx2
Line
Count
Source
99
352
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
352
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
352
                                               output_q3, width, height); \
102
352
  }
cfl_subsample_lbd_422_32x8_avx2
Line
Count
Source
99
512
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
512
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
512
                                               output_q3, width, height); \
102
512
  }
cfl_subsample_lbd_444_32x32_avx2
Line
Count
Source
99
11.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
11.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
11.8k
                                               output_q3, width, height); \
102
11.8k
  }
cfl_subsample_lbd_444_32x16_avx2
Line
Count
Source
99
6.93k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
6.93k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
6.93k
                                               output_q3, width, height); \
102
6.93k
  }
cfl_subsample_lbd_444_32x8_avx2
Line
Count
Source
99
9.09k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
9.09k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
9.09k
                                               output_q3, width, height); \
102
9.09k
  }
cfl_subsample_hbd_420_32x32_avx2
Line
Count
Source
99
9.46k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
9.46k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
9.46k
                                               output_q3, width, height); \
102
9.46k
  }
cfl_subsample_hbd_420_32x16_avx2
Line
Count
Source
99
3.82k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
3.82k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
3.82k
                                               output_q3, width, height); \
102
3.82k
  }
cfl_subsample_hbd_420_32x8_avx2
Line
Count
Source
99
7.27k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
7.27k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
7.27k
                                               output_q3, width, height); \
102
7.27k
  }
cfl_subsample_hbd_422_32x32_avx2
Line
Count
Source
99
26
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
26
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
26
                                               output_q3, width, height); \
102
26
  }
cfl_subsample_hbd_422_32x16_avx2
Line
Count
Source
99
80
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
80
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
80
                                               output_q3, width, height); \
102
80
  }
cfl_subsample_hbd_422_32x8_avx2
Line
Count
Source
99
13
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
13
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
13
                                               output_q3, width, height); \
102
13
  }
cfl_subsample_hbd_444_32x32_avx2
Line
Count
Source
99
19.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
19.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
19.2k
                                               output_q3, width, height); \
102
19.2k
  }
cfl_subsample_hbd_444_32x16_avx2
Line
Count
Source
99
8.63k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
8.63k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
8.63k
                                               output_q3, width, height); \
102
8.63k
  }
cfl_subsample_hbd_444_32x8_avx2
Line
Count
Source
99
30.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
100
30.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
101
30.2k
                                               output_q3, width, height); \
102
30.2k
  }
103
104
// Declare size-specific wrappers for all valid CfL sizes.
105
#define CFL_SUBSAMPLE_FUNCTIONS(arch, sub, bd)                            \
106
  CFL_SUBSAMPLE(arch, sub, bd, 4, 4)                                      \
107
  CFL_SUBSAMPLE(arch, sub, bd, 8, 8)                                      \
108
  CFL_SUBSAMPLE(arch, sub, bd, 16, 16)                                    \
109
  CFL_SUBSAMPLE(arch, sub, bd, 32, 32)                                    \
110
  CFL_SUBSAMPLE(arch, sub, bd, 4, 8)                                      \
111
  CFL_SUBSAMPLE(arch, sub, bd, 8, 4)                                      \
112
  CFL_SUBSAMPLE(arch, sub, bd, 8, 16)                                     \
113
  CFL_SUBSAMPLE(arch, sub, bd, 16, 8)                                     \
114
  CFL_SUBSAMPLE(arch, sub, bd, 16, 32)                                    \
115
  CFL_SUBSAMPLE(arch, sub, bd, 32, 16)                                    \
116
  CFL_SUBSAMPLE(arch, sub, bd, 4, 16)                                     \
117
  CFL_SUBSAMPLE(arch, sub, bd, 16, 4)                                     \
118
  CFL_SUBSAMPLE(arch, sub, bd, 8, 32)                                     \
119
  CFL_SUBSAMPLE(arch, sub, bd, 32, 8)                                     \
120
  cfl_subsample_##bd##_fn cfl_get_luma_subsampling_##sub##_##bd##_##arch( \
121
0
      TX_SIZE tx_size) {                                                  \
122
0
    CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
123
0
    return subfn_##sub[tx_size];                                          \
124
0
  }
Unexecuted instantiation: cfl_get_luma_subsampling_420_lbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_422_lbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_444_lbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_420_hbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_422_hbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_444_hbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_420_lbd_ssse3
Unexecuted instantiation: cfl_get_luma_subsampling_422_lbd_ssse3
Unexecuted instantiation: cfl_get_luma_subsampling_444_lbd_ssse3
Unexecuted instantiation: cfl_get_luma_subsampling_420_hbd_ssse3
Unexecuted instantiation: cfl_get_luma_subsampling_422_hbd_ssse3
Unexecuted instantiation: cfl_get_luma_subsampling_444_hbd_ssse3
125
126
// Declare an architecture-specific array of function pointers for size-specific
127
// wrappers.
128
#define CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
129
0
  static const cfl_subsample_##bd##_fn subfn_##sub[TX_SIZES_ALL] = {          \
130
0
    cfl_subsample_##bd##_##sub##_4x4_##arch,   /* 4x4 */                      \
131
0
    cfl_subsample_##bd##_##sub##_8x8_##arch,   /* 8x8 */                      \
132
0
    cfl_subsample_##bd##_##sub##_16x16_##arch, /* 16x16 */                    \
133
0
    cfl_subsample_##bd##_##sub##_32x32_##arch, /* 32x32 */                    \
134
0
    NULL,                                      /* 64x64 (invalid CFL size) */ \
135
0
    cfl_subsample_##bd##_##sub##_4x8_##arch,   /* 4x8 */                      \
136
0
    cfl_subsample_##bd##_##sub##_8x4_##arch,   /* 8x4 */                      \
137
0
    cfl_subsample_##bd##_##sub##_8x16_##arch,  /* 8x16 */                     \
138
0
    cfl_subsample_##bd##_##sub##_16x8_##arch,  /* 16x8 */                     \
139
0
    cfl_subsample_##bd##_##sub##_16x32_##arch, /* 16x32 */                    \
140
0
    cfl_subsample_##bd##_##sub##_32x16_##arch, /* 32x16 */                    \
141
0
    NULL,                                      /* 32x64 (invalid CFL size) */ \
142
0
    NULL,                                      /* 64x32 (invalid CFL size) */ \
143
0
    cfl_subsample_##bd##_##sub##_4x16_##arch,  /* 4x16  */                    \
144
0
    cfl_subsample_##bd##_##sub##_16x4_##arch,  /* 16x4  */                    \
145
0
    cfl_subsample_##bd##_##sub##_8x32_##arch,  /* 8x32  */                    \
146
0
    cfl_subsample_##bd##_##sub##_32x8_##arch,  /* 32x8  */                    \
147
0
    NULL,                                      /* 16x64 (invalid CFL size) */ \
148
0
    NULL,                                      /* 64x16 (invalid CFL size) */ \
149
0
  };
150
151
// The RTCD script does not support passing in an array, so we wrap it in this
152
// function.
153
#if CONFIG_AV1_HIGHBITDEPTH
154
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
155
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
156
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
157
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd) \
158
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, hbd) \
159
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, hbd) \
160
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, hbd)
161
#else
162
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
163
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
164
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
165
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd)
166
#endif
167
168
// Declare a size-specific wrapper for the size-generic function. The compiler
169
// will inline the size generic function in here, the advantage is that the size
170
// will be constant allowing for loop unrolling and other constant propagated
171
// goodness.
172
#define CFL_SUB_AVG_X(arch, width, height, round_offset, num_pel_log2)       \
173
  void cfl_subtract_average_##width##x##height##_##arch(const uint16_t *src, \
174
1.30M
                                                        int16_t *dst) {      \
175
1.30M
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
1.30M
                            num_pel_log2);                                   \
177
1.30M
  }
Unexecuted instantiation: cfl_subtract_average_4x4_c
Unexecuted instantiation: cfl_subtract_average_4x8_c
Unexecuted instantiation: cfl_subtract_average_4x16_c
Unexecuted instantiation: cfl_subtract_average_8x4_c
Unexecuted instantiation: cfl_subtract_average_8x8_c
Unexecuted instantiation: cfl_subtract_average_8x16_c
Unexecuted instantiation: cfl_subtract_average_8x32_c
Unexecuted instantiation: cfl_subtract_average_16x4_c
Unexecuted instantiation: cfl_subtract_average_16x8_c
Unexecuted instantiation: cfl_subtract_average_16x16_c
Unexecuted instantiation: cfl_subtract_average_16x32_c
Unexecuted instantiation: cfl_subtract_average_32x8_c
Unexecuted instantiation: cfl_subtract_average_32x16_c
Unexecuted instantiation: cfl_subtract_average_32x32_c
cfl_subtract_average_4x4_sse2
Line
Count
Source
174
230k
                                                        int16_t *dst) {      \
175
230k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
230k
                            num_pel_log2);                                   \
177
230k
  }
cfl_subtract_average_4x8_sse2
Line
Count
Source
174
90.9k
                                                        int16_t *dst) {      \
175
90.9k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
90.9k
                            num_pel_log2);                                   \
177
90.9k
  }
cfl_subtract_average_4x16_sse2
Line
Count
Source
174
105k
                                                        int16_t *dst) {      \
175
105k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
105k
                            num_pel_log2);                                   \
177
105k
  }
cfl_subtract_average_8x4_sse2
Line
Count
Source
174
154k
                                                        int16_t *dst) {      \
175
154k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
154k
                            num_pel_log2);                                   \
177
154k
  }
cfl_subtract_average_8x8_sse2
Line
Count
Source
174
186k
                                                        int16_t *dst) {      \
175
186k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
186k
                            num_pel_log2);                                   \
177
186k
  }
cfl_subtract_average_8x16_sse2
Line
Count
Source
174
69.6k
                                                        int16_t *dst) {      \
175
69.6k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
69.6k
                            num_pel_log2);                                   \
177
69.6k
  }
cfl_subtract_average_8x32_sse2
Line
Count
Source
174
38.5k
                                                        int16_t *dst) {      \
175
38.5k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
38.5k
                            num_pel_log2);                                   \
177
38.5k
  }
Unexecuted instantiation: cfl_subtract_average_16x4_sse2
Unexecuted instantiation: cfl_subtract_average_16x8_sse2
Unexecuted instantiation: cfl_subtract_average_16x16_sse2
Unexecuted instantiation: cfl_subtract_average_16x32_sse2
Unexecuted instantiation: cfl_subtract_average_32x8_sse2
Unexecuted instantiation: cfl_subtract_average_32x16_sse2
Unexecuted instantiation: cfl_subtract_average_32x32_sse2
cfl_subtract_average_16x4_avx2
Line
Count
Source
174
109k
                                                        int16_t *dst) {      \
175
109k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
109k
                            num_pel_log2);                                   \
177
109k
  }
cfl_subtract_average_16x8_avx2
Line
Count
Source
174
88.3k
                                                        int16_t *dst) {      \
175
88.3k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
88.3k
                            num_pel_log2);                                   \
177
88.3k
  }
cfl_subtract_average_16x16_avx2
Line
Count
Source
174
123k
                                                        int16_t *dst) {      \
175
123k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
123k
                            num_pel_log2);                                   \
177
123k
  }
cfl_subtract_average_16x32_avx2
Line
Count
Source
174
18.0k
                                                        int16_t *dst) {      \
175
18.0k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
18.0k
                            num_pel_log2);                                   \
177
18.0k
  }
cfl_subtract_average_32x8_avx2
Line
Count
Source
174
40.5k
                                                        int16_t *dst) {      \
175
40.5k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
40.5k
                            num_pel_log2);                                   \
177
40.5k
  }
cfl_subtract_average_32x16_avx2
Line
Count
Source
174
15.8k
                                                        int16_t *dst) {      \
175
15.8k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
15.8k
                            num_pel_log2);                                   \
177
15.8k
  }
cfl_subtract_average_32x32_avx2
Line
Count
Source
174
32.1k
                                                        int16_t *dst) {      \
175
32.1k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
176
32.1k
                            num_pel_log2);                                   \
177
32.1k
  }
178
179
// Declare size-specific wrappers for all valid CfL sizes.
180
#define CFL_SUB_AVG_FN(arch)                                              \
181
  CFL_SUB_AVG_X(arch, 4, 4, 8, 4)                                         \
182
  CFL_SUB_AVG_X(arch, 4, 8, 16, 5)                                        \
183
  CFL_SUB_AVG_X(arch, 4, 16, 32, 6)                                       \
184
  CFL_SUB_AVG_X(arch, 8, 4, 16, 5)                                        \
185
  CFL_SUB_AVG_X(arch, 8, 8, 32, 6)                                        \
186
  CFL_SUB_AVG_X(arch, 8, 16, 64, 7)                                       \
187
  CFL_SUB_AVG_X(arch, 8, 32, 128, 8)                                      \
188
  CFL_SUB_AVG_X(arch, 16, 4, 32, 6)                                       \
189
  CFL_SUB_AVG_X(arch, 16, 8, 64, 7)                                       \
190
  CFL_SUB_AVG_X(arch, 16, 16, 128, 8)                                     \
191
  CFL_SUB_AVG_X(arch, 16, 32, 256, 9)                                     \
192
  CFL_SUB_AVG_X(arch, 32, 8, 128, 8)                                      \
193
  CFL_SUB_AVG_X(arch, 32, 16, 256, 9)                                     \
194
  CFL_SUB_AVG_X(arch, 32, 32, 512, 10)                                    \
195
  cfl_subtract_average_fn cfl_get_subtract_average_fn_##arch(             \
196
0
      TX_SIZE tx_size) {                                                  \
197
0
    static const cfl_subtract_average_fn sub_avg[TX_SIZES_ALL] = {        \
198
0
      cfl_subtract_average_4x4_##arch,   /* 4x4 */                        \
199
0
      cfl_subtract_average_8x8_##arch,   /* 8x8 */                        \
200
0
      cfl_subtract_average_16x16_##arch, /* 16x16 */                      \
201
0
      cfl_subtract_average_32x32_##arch, /* 32x32 */                      \
202
0
      NULL,                              /* 64x64 (invalid CFL size) */   \
203
0
      cfl_subtract_average_4x8_##arch,   /* 4x8 */                        \
204
0
      cfl_subtract_average_8x4_##arch,   /* 8x4 */                        \
205
0
      cfl_subtract_average_8x16_##arch,  /* 8x16 */                       \
206
0
      cfl_subtract_average_16x8_##arch,  /* 16x8 */                       \
207
0
      cfl_subtract_average_16x32_##arch, /* 16x32 */                      \
208
0
      cfl_subtract_average_32x16_##arch, /* 32x16 */                      \
209
0
      NULL,                              /* 32x64 (invalid CFL size) */   \
210
0
      NULL,                              /* 64x32 (invalid CFL size) */   \
211
0
      cfl_subtract_average_4x16_##arch,  /* 4x16 */                       \
212
0
      cfl_subtract_average_16x4_##arch,  /* 16x4 */                       \
213
0
      cfl_subtract_average_8x32_##arch,  /* 8x32 */                       \
214
0
      cfl_subtract_average_32x8_##arch,  /* 32x8 */                       \
215
0
      NULL,                              /* 16x64 (invalid CFL size) */   \
216
0
      NULL,                              /* 64x16 (invalid CFL size) */   \
217
0
    };                                                                    \
218
0
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */ \
219
0
    /* index the function pointer array out of bounds. */                 \
220
0
    return sub_avg[tx_size % TX_SIZES_ALL];                               \
221
0
  }
Unexecuted instantiation: cfl_get_subtract_average_fn_c
Unexecuted instantiation: cfl_get_subtract_average_fn_sse2
222
223
// For VSX SIMD optimization, the C versions of width == 4 subtract are
224
// faster than the VSX. As such, the VSX code calls the C versions.
225
void cfl_subtract_average_4x4_c(const uint16_t *src, int16_t *dst);
226
void cfl_subtract_average_4x8_c(const uint16_t *src, int16_t *dst);
227
void cfl_subtract_average_4x16_c(const uint16_t *src, int16_t *dst);
228
229
#define CFL_PREDICT_lbd(arch, width, height)                              \
230
  void cfl_predict_lbd_##width##x##height##_##arch(                       \
231
      const int16_t *pred_buf_q3, uint8_t *dst, int dst_stride,           \
232
1.33M
      int alpha_q3) {                                                     \
233
1.33M
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
1.33M
                           height);                                       \
235
1.33M
  }
Unexecuted instantiation: cfl_predict_lbd_4x4_c
Unexecuted instantiation: cfl_predict_lbd_4x8_c
Unexecuted instantiation: cfl_predict_lbd_4x16_c
Unexecuted instantiation: cfl_predict_lbd_8x4_c
Unexecuted instantiation: cfl_predict_lbd_8x8_c
Unexecuted instantiation: cfl_predict_lbd_8x16_c
Unexecuted instantiation: cfl_predict_lbd_8x32_c
Unexecuted instantiation: cfl_predict_lbd_16x4_c
Unexecuted instantiation: cfl_predict_lbd_16x8_c
Unexecuted instantiation: cfl_predict_lbd_16x16_c
Unexecuted instantiation: cfl_predict_lbd_16x32_c
Unexecuted instantiation: cfl_predict_lbd_32x8_c
Unexecuted instantiation: cfl_predict_lbd_32x16_c
Unexecuted instantiation: cfl_predict_lbd_32x32_c
cfl_predict_lbd_4x4_ssse3
Line
Count
Source
232
300k
      int alpha_q3) {                                                     \
233
300k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
300k
                           height);                                       \
235
300k
  }
cfl_predict_lbd_4x8_ssse3
Line
Count
Source
232
115k
      int alpha_q3) {                                                     \
233
115k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
115k
                           height);                                       \
235
115k
  }
cfl_predict_lbd_4x16_ssse3
Line
Count
Source
232
115k
      int alpha_q3) {                                                     \
233
115k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
115k
                           height);                                       \
235
115k
  }
cfl_predict_lbd_8x4_ssse3
Line
Count
Source
232
169k
      int alpha_q3) {                                                     \
233
169k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
169k
                           height);                                       \
235
169k
  }
cfl_predict_lbd_8x8_ssse3
Line
Count
Source
232
185k
      int alpha_q3) {                                                     \
233
185k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
185k
                           height);                                       \
235
185k
  }
cfl_predict_lbd_8x16_ssse3
Line
Count
Source
232
50.3k
      int alpha_q3) {                                                     \
233
50.3k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
50.3k
                           height);                                       \
235
50.3k
  }
cfl_predict_lbd_8x32_ssse3
Line
Count
Source
232
31.9k
      int alpha_q3) {                                                     \
233
31.9k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
31.9k
                           height);                                       \
235
31.9k
  }
cfl_predict_lbd_16x4_ssse3
Line
Count
Source
232
105k
      int alpha_q3) {                                                     \
233
105k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
105k
                           height);                                       \
235
105k
  }
cfl_predict_lbd_16x8_ssse3
Line
Count
Source
232
67.5k
      int alpha_q3) {                                                     \
233
67.5k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
67.5k
                           height);                                       \
235
67.5k
  }
cfl_predict_lbd_16x16_ssse3
Line
Count
Source
232
119k
      int alpha_q3) {                                                     \
233
119k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
119k
                           height);                                       \
235
119k
  }
cfl_predict_lbd_16x32_ssse3
Line
Count
Source
232
17.4k
      int alpha_q3) {                                                     \
233
17.4k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
17.4k
                           height);                                       \
235
17.4k
  }
Unexecuted instantiation: cfl_predict_lbd_32x8_ssse3
Unexecuted instantiation: cfl_predict_lbd_32x16_ssse3
Unexecuted instantiation: cfl_predict_lbd_32x32_ssse3
cfl_predict_lbd_32x8_avx2
Line
Count
Source
232
18.3k
      int alpha_q3) {                                                     \
233
18.3k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
18.3k
                           height);                                       \
235
18.3k
  }
cfl_predict_lbd_32x16_avx2
Line
Count
Source
232
13.9k
      int alpha_q3) {                                                     \
233
13.9k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
13.9k
                           height);                                       \
235
13.9k
  }
cfl_predict_lbd_32x32_avx2
Line
Count
Source
232
23.9k
      int alpha_q3) {                                                     \
233
23.9k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
234
23.9k
                           height);                                       \
235
23.9k
  }
236
237
#if CONFIG_AV1_HIGHBITDEPTH
238
// Generates a fixed-size high-bit-depth CfL prediction wrapper.
//
// CFL_PREDICT_hbd(arch, width, height) defines the function
//   void cfl_predict_hbd_<width>x<height>_<arch>(const int16_t *pred_buf_q3,
//                                                uint16_t *dst,
//                                                int dst_stride,
//                                                int alpha_q3, int bd)
// which forwards its arguments unchanged to cfl_predict_hbd_<arch>() and
// appends the macro's width and height as the last two arguments.
#define CFL_PREDICT_hbd(arch, width, height)                                   \
239
  void cfl_predict_hbd_##width##x##height##_##arch(                            \
240
      const int16_t *pred_buf_q3, uint16_t *dst, int dst_stride, int alpha_q3, \
241
1.27M
      int bd) {                                                                \
242
1.27M
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
1.27M
                           height);                                            \
244
1.27M
  }
Unexecuted instantiation: cfl_predict_hbd_4x4_c
Unexecuted instantiation: cfl_predict_hbd_4x8_c
Unexecuted instantiation: cfl_predict_hbd_4x16_c
Unexecuted instantiation: cfl_predict_hbd_8x4_c
Unexecuted instantiation: cfl_predict_hbd_8x8_c
Unexecuted instantiation: cfl_predict_hbd_8x16_c
Unexecuted instantiation: cfl_predict_hbd_8x32_c
Unexecuted instantiation: cfl_predict_hbd_16x4_c
Unexecuted instantiation: cfl_predict_hbd_16x8_c
Unexecuted instantiation: cfl_predict_hbd_16x16_c
Unexecuted instantiation: cfl_predict_hbd_16x32_c
Unexecuted instantiation: cfl_predict_hbd_32x8_c
Unexecuted instantiation: cfl_predict_hbd_32x16_c
Unexecuted instantiation: cfl_predict_hbd_32x32_c
cfl_predict_hbd_4x4_ssse3
Line
Count
Source
241
161k
      int bd) {                                                                \
242
161k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
161k
                           height);                                            \
244
161k
  }
cfl_predict_hbd_4x8_ssse3
Line
Count
Source
241
66.9k
      int bd) {                                                                \
242
66.9k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
66.9k
                           height);                                            \
244
66.9k
  }
cfl_predict_hbd_4x16_ssse3
Line
Count
Source
241
95.9k
      int bd) {                                                                \
242
95.9k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
95.9k
                           height);                                            \
244
95.9k
  }
cfl_predict_hbd_8x4_ssse3
Line
Count
Source
241
139k
      int bd) {                                                                \
242
139k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
139k
                           height);                                            \
244
139k
  }
cfl_predict_hbd_8x8_ssse3
Line
Count
Source
241
188k
      int bd) {                                                                \
242
188k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
188k
                           height);                                            \
244
188k
  }
cfl_predict_hbd_8x16_ssse3
Line
Count
Source
241
88.9k
      int bd) {                                                                \
242
88.9k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
88.9k
                           height);                                            \
244
88.9k
  }
cfl_predict_hbd_8x32_ssse3
Line
Count
Source
241
45.1k
      int bd) {                                                                \
242
45.1k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
45.1k
                           height);                                            \
244
45.1k
  }
Unexecuted instantiation: cfl_predict_hbd_16x4_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x8_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x16_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x32_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x8_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x16_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x32_ssse3
cfl_predict_hbd_16x4_avx2
Line
Count
Source
241
113k
      int bd) {                                                                \
242
113k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
113k
                           height);                                            \
244
113k
  }
cfl_predict_hbd_16x8_avx2
Line
Count
Source
241
109k
      int bd) {                                                                \
242
109k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
109k
                           height);                                            \
244
109k
  }
cfl_predict_hbd_16x16_avx2
Line
Count
Source
241
127k
      int bd) {                                                                \
242
127k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
127k
                           height);                                            \
244
127k
  }
cfl_predict_hbd_16x32_avx2
Line
Count
Source
241
18.6k
      int bd) {                                                                \
242
18.6k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
18.6k
                           height);                                            \
244
18.6k
  }
cfl_predict_hbd_32x8_avx2
Line
Count
Source
241
62.6k
      int bd) {                                                                \
242
62.6k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
62.6k
                           height);                                            \
244
62.6k
  }
cfl_predict_hbd_32x16_avx2
Line
Count
Source
241
17.7k
      int bd) {                                                                \
242
17.7k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
17.7k
                           height);                                            \
244
17.7k
  }
cfl_predict_hbd_32x32_avx2
Line
Count
Source
241
40.4k
      int bd) {                                                                \
242
40.4k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
243
40.4k
                           height);                                            \
244
40.4k
  }
245
#endif
246
247
// This wrapper exists because clang format does not like calling macros with
248
// lowercase letters.
// It pastes `bd` onto the CFL_PREDICT_ prefix, so for example bd = hbd expands
// to CFL_PREDICT_hbd(arch, width, height).
249
#define CFL_PREDICT_X(arch, width, height, bd) \
250
  CFL_PREDICT_##bd(arch, width, height)
251
252
// Generates every fixed-size CfL prediction wrapper for one (arch, bd) pair
// together with the lookup function that selects among them.
//
// The expansion first invokes CFL_PREDICT_X once for each of the 14 block
// sizes listed below (4x4 up to 32x32), then defines
//   cfl_predict_<bd>_fn cfl_get_predict_<bd>_fn_<arch>(TX_SIZE tx_size)
// which returns the entry of a static table indexed by tx_size.
//
// The table has TX_SIZES_ALL slots; the comment on each initializer names the
// transform size that slot stands for. Slots for sizes with a 64-sample
// dimension hold NULL, so the returned pointer is NULL for those sizes.
// The modulo on the index only keeps the lookup inside the table; it does not
// turn a NULL slot into a valid function.
// NOTE(review): callers presumably never request a 64-sized transform here --
// confirm before relying on a non-NULL result.
#define CFL_PREDICT_FN(arch, bd)                                            \
253
  CFL_PREDICT_X(arch, 4, 4, bd)                                             \
254
  CFL_PREDICT_X(arch, 4, 8, bd)                                             \
255
  CFL_PREDICT_X(arch, 4, 16, bd)                                            \
256
  CFL_PREDICT_X(arch, 8, 4, bd)                                             \
257
  CFL_PREDICT_X(arch, 8, 8, bd)                                             \
258
  CFL_PREDICT_X(arch, 8, 16, bd)                                            \
259
  CFL_PREDICT_X(arch, 8, 32, bd)                                            \
260
  CFL_PREDICT_X(arch, 16, 4, bd)                                            \
261
  CFL_PREDICT_X(arch, 16, 8, bd)                                            \
262
  CFL_PREDICT_X(arch, 16, 16, bd)                                           \
263
  CFL_PREDICT_X(arch, 16, 32, bd)                                           \
264
  CFL_PREDICT_X(arch, 32, 8, bd)                                            \
265
  CFL_PREDICT_X(arch, 32, 16, bd)                                           \
266
  CFL_PREDICT_X(arch, 32, 32, bd)                                           \
267
0
  cfl_predict_##bd##_fn cfl_get_predict_##bd##_fn_##arch(TX_SIZE tx_size) { \
268
0
    static const cfl_predict_##bd##_fn pred[TX_SIZES_ALL] = {               \
269
0
      cfl_predict_##bd##_4x4_##arch,   /* 4x4 */                            \
270
0
      cfl_predict_##bd##_8x8_##arch,   /* 8x8 */                            \
271
0
      cfl_predict_##bd##_16x16_##arch, /* 16x16 */                          \
272
0
      cfl_predict_##bd##_32x32_##arch, /* 32x32 */                          \
273
0
      NULL,                            /* 64x64 (invalid CFL size) */       \
274
0
      cfl_predict_##bd##_4x8_##arch,   /* 4x8 */                            \
275
0
      cfl_predict_##bd##_8x4_##arch,   /* 8x4 */                            \
276
0
      cfl_predict_##bd##_8x16_##arch,  /* 8x16 */                           \
277
0
      cfl_predict_##bd##_16x8_##arch,  /* 16x8 */                           \
278
0
      cfl_predict_##bd##_16x32_##arch, /* 16x32 */                          \
279
0
      cfl_predict_##bd##_32x16_##arch, /* 32x16 */                          \
280
0
      NULL,                            /* 32x64 (invalid CFL size) */       \
281
0
      NULL,                            /* 64x32 (invalid CFL size) */       \
282
0
      cfl_predict_##bd##_4x16_##arch,  /* 4x16  */                          \
283
0
      cfl_predict_##bd##_16x4_##arch,  /* 16x4  */                          \
284
0
      cfl_predict_##bd##_8x32_##arch,  /* 8x32  */                          \
285
0
      cfl_predict_##bd##_32x8_##arch,  /* 32x8  */                          \
286
0
      NULL,                            /* 16x64 (invalid CFL size) */       \
287
0
      NULL,                            /* 64x16 (invalid CFL size) */       \
288
0
    };                                                                      \
289
0
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */   \
290
0
    /* index the function pointer array out of bounds. */                   \
291
0
    return pred[tx_size % TX_SIZES_ALL];                                    \
292
0
  }
Unexecuted instantiation: cfl_get_predict_lbd_fn_c
Unexecuted instantiation: cfl_get_predict_hbd_fn_c
Unexecuted instantiation: cfl_get_predict_lbd_fn_ssse3
Unexecuted instantiation: cfl_get_predict_hbd_fn_ssse3
293
294
#endif  // AOM_AV1_COMMON_CFL_H_