Coverage Report

Created: 2026-05-16 06:27

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/aom/av1/common/cfl.h
Line
Count
Source
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#ifndef AOM_AV1_COMMON_CFL_H_
13
#define AOM_AV1_COMMON_CFL_H_
14
15
#include "av1/common/av1_common_int.h"
16
#include "av1/common/blockd.h"
17
18
// Can we use CfL for the current block?
19
10.0M
static inline CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
10.0M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
10.0M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
10.0M
  assert(bsize < BLOCK_SIZES_ALL);
23
10.0M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
48.6k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
48.6k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
48.6k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
48.6k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
48.6k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
10.0M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
9.31M
                            block_size_high[bsize] <= 32);
34
10.0M
}
Unexecuted instantiation: decodeframe.c:is_cfl_allowed
decodemv.c:is_cfl_allowed
Line
Count
Source
19
7.53M
static inline CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
7.53M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
7.53M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
7.53M
  assert(bsize < BLOCK_SIZES_ALL);
23
7.53M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
48.0k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
48.0k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
48.0k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
48.0k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
48.0k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
7.48M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
6.77M
                            block_size_high[bsize] <= 32);
34
7.53M
}
cfl.c:is_cfl_allowed
Line
Count
Source
19
2.53M
static inline CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
2.53M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
2.53M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
2.53M
  assert(bsize < BLOCK_SIZES_ALL);
23
2.53M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
524
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
524
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
524
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
524
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
524
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
2.53M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
2.53M
                            block_size_high[bsize] <= 32);
34
2.53M
}
Unexecuted instantiation: reconintra.c:is_cfl_allowed
Unexecuted instantiation: cfl_sse2.c:is_cfl_allowed
Unexecuted instantiation: cfl_ssse3.c:is_cfl_allowed
Unexecuted instantiation: cfl_avx2.c:is_cfl_allowed
35
36
// Do we need to save the luma pixels from the current block,
37
// for a possible future CfL prediction?
38
static inline CFL_ALLOWED_TYPE store_cfl_required(const AV1_COMMON *cm,
39
42.6M
                                                  const MACROBLOCKD *xd) {
40
42.6M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
42.6M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
40.9M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
2.09M
    return CFL_ALLOWED;
51
2.09M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
38.8M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
33.4M
                            mbmi->uv_mode == UV_CFL_PRED);
57
40.9M
}
decodeframe.c:store_cfl_required
Line
Count
Source
39
30.6M
                                                  const MACROBLOCKD *xd) {
40
30.6M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
30.6M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
29.5M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
1.03M
    return CFL_ALLOWED;
51
1.03M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
28.5M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
25.9M
                            mbmi->uv_mode == UV_CFL_PRED);
57
29.5M
}
decodemv.c:store_cfl_required
Line
Count
Source
39
12.0M
                                                  const MACROBLOCKD *xd) {
40
12.0M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
12.0M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
11.3M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
1.05M
    return CFL_ALLOWED;
51
1.05M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
10.3M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
7.53M
                            mbmi->uv_mode == UV_CFL_PRED);
57
11.3M
}
Unexecuted instantiation: cfl.c:store_cfl_required
Unexecuted instantiation: reconintra.c:store_cfl_required
Unexecuted instantiation: cfl_sse2.c:store_cfl_required
Unexecuted instantiation: cfl_ssse3.c:store_cfl_required
Unexecuted instantiation: cfl_avx2.c:store_cfl_required
58
59
0
static inline int get_scaled_luma_q0(int alpha_q3, int16_t pred_buf_q3) {
60
0
  int scaled_luma_q6 = alpha_q3 * pred_buf_q3;
61
0
  return ROUND_POWER_OF_TWO_SIGNED(scaled_luma_q6, 6);
62
0
}
Unexecuted instantiation: decodeframe.c:get_scaled_luma_q0
Unexecuted instantiation: decodemv.c:get_scaled_luma_q0
Unexecuted instantiation: cfl.c:get_scaled_luma_q0
Unexecuted instantiation: reconintra.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_sse2.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_ssse3.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_avx2.c:get_scaled_luma_q0
63
64
2.53M
static inline CFL_PRED_TYPE get_cfl_pred_type(int plane) {
65
2.53M
  assert(plane > 0);
66
2.53M
  return (CFL_PRED_TYPE)(plane - 1);
67
2.53M
}
Unexecuted instantiation: decodeframe.c:get_cfl_pred_type
Unexecuted instantiation: decodemv.c:get_cfl_pred_type
Unexecuted instantiation: cfl.c:get_cfl_pred_type
reconintra.c:get_cfl_pred_type
Line
Count
Source
64
2.53M
static inline CFL_PRED_TYPE get_cfl_pred_type(int plane) {
65
2.53M
  assert(plane > 0);
66
2.53M
  return (CFL_PRED_TYPE)(plane - 1);
67
2.53M
}
Unexecuted instantiation: cfl_sse2.c:get_cfl_pred_type
Unexecuted instantiation: cfl_ssse3.c:get_cfl_pred_type
Unexecuted instantiation: cfl_avx2.c:get_cfl_pred_type
68
69
237k
static inline void clear_cfl_dc_pred_cache_flags(CFL_CTX *cfl) {
70
237k
  cfl->use_dc_pred_cache = false;
71
237k
  cfl->dc_pred_is_cached[CFL_PRED_U] = false;
72
237k
  cfl->dc_pred_is_cached[CFL_PRED_V] = false;
73
237k
}
Unexecuted instantiation: decodeframe.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: decodemv.c:clear_cfl_dc_pred_cache_flags
cfl.c:clear_cfl_dc_pred_cache_flags
Line
Count
Source
69
237k
static inline void clear_cfl_dc_pred_cache_flags(CFL_CTX *cfl) {
70
237k
  cfl->use_dc_pred_cache = false;
71
237k
  cfl->dc_pred_is_cached[CFL_PRED_U] = false;
72
237k
  cfl->dc_pred_is_cached[CFL_PRED_V] = false;
73
237k
}
Unexecuted instantiation: reconintra.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_sse2.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_ssse3.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_avx2.c:clear_cfl_dc_pred_cache_flags
74
75
void av1_cfl_predict_block(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
76
                           TX_SIZE tx_size, int plane);
77
78
void cfl_store_block(MACROBLOCKD *const xd, BLOCK_SIZE bsize, TX_SIZE tx_size);
79
80
void cfl_store_tx(MACROBLOCKD *const xd, int row, int col, TX_SIZE tx_size,
81
                  BLOCK_SIZE bsize);
82
83
void cfl_store_dc_pred(MACROBLOCKD *const xd, const uint8_t *input,
84
                       CFL_PRED_TYPE pred_plane, int width);
85
86
void cfl_load_dc_pred(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
87
                      TX_SIZE tx_size, CFL_PRED_TYPE pred_plane);
88
89
// Allows the CFL_SUBSAMPLE function to switch types depending on the bitdepth.
90
#define CFL_lbd_TYPE uint8_t *cfl_type
91
#define CFL_hbd_TYPE uint16_t *cfl_type
92
93
// Declare a size-specific wrapper for the size-generic function. The compiler
94
// will inline the size generic function in here, the advantage is that the size
95
// will be constant allowing for loop unrolling and other constant propagated
96
// goodness.
97
#define CFL_SUBSAMPLE(arch, sub, bd, width, height)                       \
98
  void cfl_subsample_##bd##_##sub##_##width##x##height##_##arch(          \
99
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3);      \
100
  void cfl_subsample_##bd##_##sub##_##width##x##height##_##arch(          \
101
2.40M
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
2.40M
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
2.40M
                                               output_q3, width, height); \
104
2.40M
  }
Unexecuted instantiation: cfl_subsample_lbd_420_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x8_c
cfl_subsample_lbd_420_4x4_ssse3
Line
Count
Source
101
127k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
127k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
127k
                                               output_q3, width, height); \
104
127k
  }
cfl_subsample_lbd_420_8x8_ssse3
Line
Count
Source
101
54.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
54.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
54.5k
                                               output_q3, width, height); \
104
54.5k
  }
cfl_subsample_lbd_420_16x16_ssse3
Line
Count
Source
101
30.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
30.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
30.3k
                                               output_q3, width, height); \
104
30.3k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x32_ssse3
cfl_subsample_lbd_420_4x8_ssse3
Line
Count
Source
101
65.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
65.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
65.4k
                                               output_q3, width, height); \
104
65.4k
  }
cfl_subsample_lbd_420_8x4_ssse3
Line
Count
Source
101
87.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
87.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
87.7k
                                               output_q3, width, height); \
104
87.7k
  }
cfl_subsample_lbd_420_8x16_ssse3
Line
Count
Source
101
17.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
17.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
17.2k
                                               output_q3, width, height); \
104
17.2k
  }
cfl_subsample_lbd_420_16x8_ssse3
Line
Count
Source
101
27.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
27.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
27.7k
                                               output_q3, width, height); \
104
27.7k
  }
cfl_subsample_lbd_420_16x32_ssse3
Line
Count
Source
101
5.56k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
5.56k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
5.56k
                                               output_q3, width, height); \
104
5.56k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x16_ssse3
cfl_subsample_lbd_420_4x16_ssse3
Line
Count
Source
101
80.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
80.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
80.7k
                                               output_q3, width, height); \
104
80.7k
  }
cfl_subsample_lbd_420_16x4_ssse3
Line
Count
Source
101
117k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
117k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
117k
                                               output_q3, width, height); \
104
117k
  }
cfl_subsample_lbd_420_8x32_ssse3
Line
Count
Source
101
7.93k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
7.93k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
7.93k
                                               output_q3, width, height); \
104
7.93k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x8_ssse3
cfl_subsample_lbd_422_4x4_ssse3
Line
Count
Source
101
249
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
249
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
249
                                               output_q3, width, height); \
104
249
  }
cfl_subsample_lbd_422_8x8_ssse3
Line
Count
Source
101
2.30k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
2.30k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
2.30k
                                               output_q3, width, height); \
104
2.30k
  }
cfl_subsample_lbd_422_16x16_ssse3
Line
Count
Source
101
187
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
187
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
187
                                               output_q3, width, height); \
104
187
  }
Unexecuted instantiation: cfl_subsample_lbd_422_32x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_4x8_ssse3
cfl_subsample_lbd_422_8x4_ssse3
Line
Count
Source
101
62
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
62
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
62
                                               output_q3, width, height); \
104
62
  }
Unexecuted instantiation: cfl_subsample_lbd_422_8x16_ssse3
cfl_subsample_lbd_422_16x8_ssse3
Line
Count
Source
101
252
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
252
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
252
                                               output_q3, width, height); \
104
252
  }
Unexecuted instantiation: cfl_subsample_lbd_422_16x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_32x16_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_4x16_ssse3
cfl_subsample_lbd_422_16x4_ssse3
Line
Count
Source
101
355
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
355
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
355
                                               output_q3, width, height); \
104
355
  }
Unexecuted instantiation: cfl_subsample_lbd_422_8x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_32x8_ssse3
cfl_subsample_lbd_444_4x4_ssse3
Line
Count
Source
101
45.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
45.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
45.1k
                                               output_q3, width, height); \
104
45.1k
  }
cfl_subsample_lbd_444_8x8_ssse3
Line
Count
Source
101
59.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
59.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
59.8k
                                               output_q3, width, height); \
104
59.8k
  }
cfl_subsample_lbd_444_16x16_ssse3
Line
Count
Source
101
29.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
29.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
29.5k
                                               output_q3, width, height); \
104
29.5k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x32_ssse3
cfl_subsample_lbd_444_4x8_ssse3
Line
Count
Source
101
10.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
10.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
10.2k
                                               output_q3, width, height); \
104
10.2k
  }
cfl_subsample_lbd_444_8x4_ssse3
Line
Count
Source
101
18.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
18.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
18.7k
                                               output_q3, width, height); \
104
18.7k
  }
cfl_subsample_lbd_444_8x16_ssse3
Line
Count
Source
101
17.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
17.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
17.1k
                                               output_q3, width, height); \
104
17.1k
  }
cfl_subsample_lbd_444_16x8_ssse3
Line
Count
Source
101
25.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
25.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
25.8k
                                               output_q3, width, height); \
104
25.8k
  }
cfl_subsample_lbd_444_16x32_ssse3
Line
Count
Source
101
12.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
12.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
12.7k
                                               output_q3, width, height); \
104
12.7k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x16_ssse3
cfl_subsample_lbd_444_4x16_ssse3
Line
Count
Source
101
112k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
112k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
112k
                                               output_q3, width, height); \
104
112k
  }
cfl_subsample_lbd_444_16x4_ssse3
Line
Count
Source
101
50.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
50.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
50.5k
                                               output_q3, width, height); \
104
50.5k
  }
cfl_subsample_lbd_444_8x32_ssse3
Line
Count
Source
101
14.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
14.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
14.6k
                                               output_q3, width, height); \
104
14.6k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x8_ssse3
cfl_subsample_hbd_420_4x4_ssse3
Line
Count
Source
101
139k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
139k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
139k
                                               output_q3, width, height); \
104
139k
  }
cfl_subsample_hbd_420_8x8_ssse3
Line
Count
Source
101
64.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
64.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
64.7k
                                               output_q3, width, height); \
104
64.7k
  }
cfl_subsample_hbd_420_16x16_ssse3
Line
Count
Source
101
27.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
27.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
27.1k
                                               output_q3, width, height); \
104
27.1k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x32_ssse3
cfl_subsample_hbd_420_4x8_ssse3
Line
Count
Source
101
92.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
92.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
92.7k
                                               output_q3, width, height); \
104
92.7k
  }
cfl_subsample_hbd_420_8x4_ssse3
Line
Count
Source
101
135k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
135k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
135k
                                               output_q3, width, height); \
104
135k
  }
cfl_subsample_hbd_420_8x16_ssse3
Line
Count
Source
101
11.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
11.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
11.4k
                                               output_q3, width, height); \
104
11.4k
  }
cfl_subsample_hbd_420_16x8_ssse3
Line
Count
Source
101
27.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
27.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
27.7k
                                               output_q3, width, height); \
104
27.7k
  }
cfl_subsample_hbd_420_16x32_ssse3
Line
Count
Source
101
4.19k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
4.19k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
4.19k
                                               output_q3, width, height); \
104
4.19k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x16_ssse3
cfl_subsample_hbd_420_4x16_ssse3
Line
Count
Source
101
117k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
117k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
117k
                                               output_q3, width, height); \
104
117k
  }
cfl_subsample_hbd_420_16x4_ssse3
Line
Count
Source
101
162k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
162k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
162k
                                               output_q3, width, height); \
104
162k
  }
cfl_subsample_hbd_420_8x32_ssse3
Line
Count
Source
101
8.63k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
8.63k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
8.63k
                                               output_q3, width, height); \
104
8.63k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x8_ssse3
cfl_subsample_hbd_422_4x4_ssse3
Line
Count
Source
101
1.03k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
1.03k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
1.03k
                                               output_q3, width, height); \
104
1.03k
  }
cfl_subsample_hbd_422_8x8_ssse3
Line
Count
Source
101
97
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
97
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
97
                                               output_q3, width, height); \
104
97
  }
cfl_subsample_hbd_422_16x16_ssse3
Line
Count
Source
101
28
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
28
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
28
                                               output_q3, width, height); \
104
28
  }
Unexecuted instantiation: cfl_subsample_hbd_422_32x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_4x8_ssse3
cfl_subsample_hbd_422_8x4_ssse3
Line
Count
Source
101
294
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
294
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
294
                                               output_q3, width, height); \
104
294
  }
Unexecuted instantiation: cfl_subsample_hbd_422_8x16_ssse3
cfl_subsample_hbd_422_16x8_ssse3
Line
Count
Source
101
225
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
225
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
225
                                               output_q3, width, height); \
104
225
  }
Unexecuted instantiation: cfl_subsample_hbd_422_16x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_32x16_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_4x16_ssse3
cfl_subsample_hbd_422_16x4_ssse3
Line
Count
Source
101
39
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
39
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
39
                                               output_q3, width, height); \
104
39
  }
Unexecuted instantiation: cfl_subsample_hbd_422_8x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_32x8_ssse3
cfl_subsample_hbd_444_4x4_ssse3
Line
Count
Source
101
86.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
86.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
86.2k
                                               output_q3, width, height); \
104
86.2k
  }
cfl_subsample_hbd_444_8x8_ssse3
Line
Count
Source
101
102k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
102k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
102k
                                               output_q3, width, height); \
104
102k
  }
cfl_subsample_hbd_444_16x16_ssse3
Line
Count
Source
101
38.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
38.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
38.8k
                                               output_q3, width, height); \
104
38.8k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x32_ssse3
cfl_subsample_hbd_444_4x8_ssse3
Line
Count
Source
101
22.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
22.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
22.3k
                                               output_q3, width, height); \
104
22.3k
  }
cfl_subsample_hbd_444_8x4_ssse3
Line
Count
Source
101
35.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
35.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
35.0k
                                               output_q3, width, height); \
104
35.0k
  }
cfl_subsample_hbd_444_8x16_ssse3
Line
Count
Source
101
33.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
33.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
33.2k
                                               output_q3, width, height); \
104
33.2k
  }
cfl_subsample_hbd_444_16x8_ssse3
Line
Count
Source
101
42.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
42.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
42.0k
                                               output_q3, width, height); \
104
42.0k
  }
cfl_subsample_hbd_444_16x32_ssse3
Line
Count
Source
101
7.76k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
7.76k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
7.76k
                                               output_q3, width, height); \
104
7.76k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x16_ssse3
cfl_subsample_hbd_444_4x16_ssse3
Line
Count
Source
101
23.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
23.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
23.6k
                                               output_q3, width, height); \
104
23.6k
  }
cfl_subsample_hbd_444_16x4_ssse3
Line
Count
Source
101
40.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
40.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
40.0k
                                               output_q3, width, height); \
104
40.0k
  }
cfl_subsample_hbd_444_8x32_ssse3
Line
Count
Source
101
16.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
16.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
16.4k
                                               output_q3, width, height); \
104
16.4k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x8_ssse3
cfl_subsample_lbd_420_32x32_avx2
Line
Count
Source
101
16.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
16.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
16.5k
                                               output_q3, width, height); \
104
16.5k
  }
cfl_subsample_lbd_420_32x16_avx2
Line
Count
Source
101
5.31k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
5.31k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
5.31k
                                               output_q3, width, height); \
104
5.31k
  }
cfl_subsample_lbd_420_32x8_avx2
Line
Count
Source
101
9.47k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
9.47k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
9.47k
                                               output_q3, width, height); \
104
9.47k
  }
cfl_subsample_lbd_422_32x32_avx2
Line
Count
Source
101
329
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
329
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
329
                                               output_q3, width, height); \
104
329
  }
cfl_subsample_lbd_422_32x16_avx2
Line
Count
Source
101
156
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
156
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
156
                                               output_q3, width, height); \
104
156
  }
cfl_subsample_lbd_422_32x8_avx2
Line
Count
Source
101
352
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
352
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
352
                                               output_q3, width, height); \
104
352
  }
cfl_subsample_lbd_444_32x32_avx2
Line
Count
Source
101
14.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
14.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
14.8k
                                               output_q3, width, height); \
104
14.8k
  }
cfl_subsample_lbd_444_32x16_avx2
Line
Count
Source
101
6.06k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
6.06k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
6.06k
                                               output_q3, width, height); \
104
6.06k
  }
cfl_subsample_lbd_444_32x8_avx2
Line
Count
Source
101
11.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
11.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
11.6k
                                               output_q3, width, height); \
104
11.6k
  }
cfl_subsample_hbd_420_32x32_avx2
Line
Count
Source
101
15.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
15.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
15.0k
                                               output_q3, width, height); \
104
15.0k
  }
cfl_subsample_hbd_420_32x16_avx2
Line
Count
Source
101
5.14k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
5.14k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
5.14k
                                               output_q3, width, height); \
104
5.14k
  }
cfl_subsample_hbd_420_32x8_avx2
Line
Count
Source
101
8.45k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
8.45k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
8.45k
                                               output_q3, width, height); \
104
8.45k
  }
cfl_subsample_hbd_422_32x32_avx2
Line
Count
Source
101
13
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
13
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
13
                                               output_q3, width, height); \
104
13
  }
cfl_subsample_hbd_422_32x16_avx2
Line
Count
Source
101
119
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
119
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
119
                                               output_q3, width, height); \
104
119
  }
cfl_subsample_hbd_422_32x8_avx2
Line
Count
Source
101
62
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
62
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
62
                                               output_q3, width, height); \
104
62
  }
cfl_subsample_hbd_444_32x32_avx2
Line
Count
Source
101
16.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
16.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
16.6k
                                               output_q3, width, height); \
104
16.6k
  }
cfl_subsample_hbd_444_32x16_avx2
Line
Count
Source
101
12.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
12.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
12.4k
                                               output_q3, width, height); \
104
12.4k
  }
cfl_subsample_hbd_444_32x8_avx2
Line
Count
Source
101
17.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
17.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
17.3k
                                               output_q3, width, height); \
104
17.3k
  }
105
106
// Declare size-specific wrappers for all valid CfL sizes, plus a getter that
// maps a TX_SIZE to its wrapper. The index is reduced modulo TX_SIZES_ALL so
// that an out-of-range tx_size cannot index past the function pointer array.
107
#define CFL_SUBSAMPLE_FUNCTIONS(arch, sub, bd)                            \
108
  CFL_SUBSAMPLE(arch, sub, bd, 4, 4)                                      \
109
  CFL_SUBSAMPLE(arch, sub, bd, 8, 8)                                      \
110
  CFL_SUBSAMPLE(arch, sub, bd, 16, 16)                                    \
111
  CFL_SUBSAMPLE(arch, sub, bd, 32, 32)                                    \
112
  CFL_SUBSAMPLE(arch, sub, bd, 4, 8)                                      \
113
  CFL_SUBSAMPLE(arch, sub, bd, 8, 4)                                      \
114
  CFL_SUBSAMPLE(arch, sub, bd, 8, 16)                                     \
115
  CFL_SUBSAMPLE(arch, sub, bd, 16, 8)                                     \
116
  CFL_SUBSAMPLE(arch, sub, bd, 16, 32)                                    \
117
  CFL_SUBSAMPLE(arch, sub, bd, 32, 16)                                    \
118
  CFL_SUBSAMPLE(arch, sub, bd, 4, 16)                                     \
119
  CFL_SUBSAMPLE(arch, sub, bd, 16, 4)                                     \
120
  CFL_SUBSAMPLE(arch, sub, bd, 8, 32)                                     \
121
  CFL_SUBSAMPLE(arch, sub, bd, 32, 8)                                     \
122
  cfl_subsample_##bd##_fn cfl_get_luma_subsampling_##sub##_##bd##_##arch( \
123
0
      TX_SIZE tx_size) {                                                  \
124
0
    CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
125
0
    return subfn_##sub[tx_size % TX_SIZES_ALL];                           \
126
0
  }
127
128
// Declare an architecture-specific array of size-specific wrapper function
129
// pointers with TX_SIZES_ALL entries; sizes marked invalid for CfL are NULL.
130
#define CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
131
0
  static const cfl_subsample_##bd##_fn subfn_##sub[TX_SIZES_ALL] = {          \
132
0
    cfl_subsample_##bd##_##sub##_4x4_##arch,   /* 4x4 */                      \
133
0
    cfl_subsample_##bd##_##sub##_8x8_##arch,   /* 8x8 */                      \
134
0
    cfl_subsample_##bd##_##sub##_16x16_##arch, /* 16x16 */                    \
135
0
    cfl_subsample_##bd##_##sub##_32x32_##arch, /* 32x32 */                    \
136
0
    NULL,                                      /* 64x64 (invalid CFL size) */ \
137
0
    cfl_subsample_##bd##_##sub##_4x8_##arch,   /* 4x8 */                      \
138
0
    cfl_subsample_##bd##_##sub##_8x4_##arch,   /* 8x4 */                      \
139
0
    cfl_subsample_##bd##_##sub##_8x16_##arch,  /* 8x16 */                     \
140
0
    cfl_subsample_##bd##_##sub##_16x8_##arch,  /* 16x8 */                     \
141
0
    cfl_subsample_##bd##_##sub##_16x32_##arch, /* 16x32 */                    \
142
0
    cfl_subsample_##bd##_##sub##_32x16_##arch, /* 32x16 */                    \
143
0
    NULL,                                      /* 32x64 (invalid CFL size) */ \
144
0
    NULL,                                      /* 64x32 (invalid CFL size) */ \
145
0
    cfl_subsample_##bd##_##sub##_4x16_##arch,  /* 4x16  */                    \
146
0
    cfl_subsample_##bd##_##sub##_16x4_##arch,  /* 16x4  */                    \
147
0
    cfl_subsample_##bd##_##sub##_8x32_##arch,  /* 8x32  */                    \
148
0
    cfl_subsample_##bd##_##sub##_32x8_##arch,  /* 32x8  */                    \
149
0
    NULL,                                      /* 16x64 (invalid CFL size) */ \
150
0
    NULL,                                      /* 64x16 (invalid CFL size) */ \
151
0
  };
152
153
// The RTCD script does not support passing in an array, so we wrap it in
154
// getter functions, one per subsampling and bit depth (hbd only if enabled).
155
#if CONFIG_AV1_HIGHBITDEPTH
156
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
157
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
158
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
159
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd) \
160
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, hbd) \
161
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, hbd) \
162
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, hbd)
163
#else  // !CONFIG_AV1_HIGHBITDEPTH
164
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
165
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
166
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
167
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd)
168
#endif  // CONFIG_AV1_HIGHBITDEPTH
169
170
// Declare a size-specific wrapper for size-generic subtract_average_<arch>().
171
// The compiler can inline the generic function here; width, height,
172
// round_offset and num_pel_log2 are then constants, allowing loop unrolling
173
// and other constant propagation.
174
#define CFL_SUB_AVG_X(arch, width, height, round_offset, num_pel_log2)       \
175
  void cfl_subtract_average_##width##x##height##_##arch(const uint16_t *src, \
176
                                                        int16_t *dst);       \
177
  void cfl_subtract_average_##width##x##height##_##arch(const uint16_t *src, \
178
1.26M
                                                        int16_t *dst) {      \
179
1.26M
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
1.26M
                            num_pel_log2);                                   \
181
1.26M
  }
Unexecuted instantiation: cfl_subtract_average_4x4_c
Unexecuted instantiation: cfl_subtract_average_4x8_c
Unexecuted instantiation: cfl_subtract_average_4x16_c
Unexecuted instantiation: cfl_subtract_average_8x4_c
Unexecuted instantiation: cfl_subtract_average_8x8_c
Unexecuted instantiation: cfl_subtract_average_8x16_c
Unexecuted instantiation: cfl_subtract_average_8x32_c
Unexecuted instantiation: cfl_subtract_average_16x4_c
Unexecuted instantiation: cfl_subtract_average_16x8_c
Unexecuted instantiation: cfl_subtract_average_16x16_c
Unexecuted instantiation: cfl_subtract_average_16x32_c
Unexecuted instantiation: cfl_subtract_average_32x8_c
Unexecuted instantiation: cfl_subtract_average_32x16_c
Unexecuted instantiation: cfl_subtract_average_32x32_c
cfl_subtract_average_4x4_sse2
Line
Count
Source
178
221k
                                                        int16_t *dst) {      \
179
221k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
221k
                            num_pel_log2);                                   \
181
221k
  }
cfl_subtract_average_4x8_sse2
Line
Count
Source
178
78.1k
                                                        int16_t *dst) {      \
179
78.1k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
78.1k
                            num_pel_log2);                                   \
181
78.1k
  }
cfl_subtract_average_4x16_sse2
Line
Count
Source
178
156k
                                                        int16_t *dst) {      \
179
156k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
156k
                            num_pel_log2);                                   \
181
156k
  }
cfl_subtract_average_8x4_sse2
Line
Count
Source
178
130k
                                                        int16_t *dst) {      \
179
130k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
130k
                            num_pel_log2);                                   \
181
130k
  }
cfl_subtract_average_8x8_sse2
Line
Count
Source
178
189k
                                                        int16_t *dst) {      \
179
189k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
189k
                            num_pel_log2);                                   \
181
189k
  }
cfl_subtract_average_8x16_sse2
Line
Count
Source
178
61.1k
                                                        int16_t *dst) {      \
179
61.1k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
61.1k
                            num_pel_log2);                                   \
181
61.1k
  }
cfl_subtract_average_8x32_sse2
Line
Count
Source
178
33.3k
                                                        int16_t *dst) {      \
179
33.3k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
33.3k
                            num_pel_log2);                                   \
181
33.3k
  }
Unexecuted instantiation: cfl_subtract_average_16x4_sse2
Unexecuted instantiation: cfl_subtract_average_16x8_sse2
Unexecuted instantiation: cfl_subtract_average_16x16_sse2
Unexecuted instantiation: cfl_subtract_average_16x32_sse2
Unexecuted instantiation: cfl_subtract_average_32x8_sse2
Unexecuted instantiation: cfl_subtract_average_32x16_sse2
Unexecuted instantiation: cfl_subtract_average_32x32_sse2
cfl_subtract_average_16x4_avx2
Line
Count
Source
178
112k
                                                        int16_t *dst) {      \
179
112k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
112k
                            num_pel_log2);                                   \
181
112k
  }
cfl_subtract_average_16x8_avx2
Line
Count
Source
178
80.4k
                                                        int16_t *dst) {      \
179
80.4k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
80.4k
                            num_pel_log2);                                   \
181
80.4k
  }
cfl_subtract_average_16x16_avx2
Line
Count
Source
178
104k
                                                        int16_t *dst) {      \
179
104k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
104k
                            num_pel_log2);                                   \
181
104k
  }
cfl_subtract_average_16x32_avx2
Line
Count
Source
178
21.4k
                                                        int16_t *dst) {      \
179
21.4k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
21.4k
                            num_pel_log2);                                   \
181
21.4k
  }
cfl_subtract_average_32x8_avx2
Line
Count
Source
178
29.4k
                                                        int16_t *dst) {      \
179
29.4k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
29.4k
                            num_pel_log2);                                   \
181
29.4k
  }
cfl_subtract_average_32x16_avx2
Line
Count
Source
178
18.7k
                                                        int16_t *dst) {      \
179
18.7k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
18.7k
                            num_pel_log2);                                   \
181
18.7k
  }
cfl_subtract_average_32x32_avx2
Line
Count
Source
178
31.9k
                                                        int16_t *dst) {      \
179
31.9k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
31.9k
                            num_pel_log2);                                   \
181
31.9k
  }
182
183
// Declare size-specific wrappers for all valid CfL sizes, plus a getter that
// returns the wrapper for a TX_SIZE (NULL for sizes CfL does not support).
// Each CFL_SUB_AVG_X row passes round_offset = width * height / 2 and
// num_pel_log2 = log2(width * height).
184
#define CFL_SUB_AVG_FN(arch)                                              \
185
  CFL_SUB_AVG_X(arch, 4, 4, 8, 4)                                         \
186
  CFL_SUB_AVG_X(arch, 4, 8, 16, 5)                                        \
187
  CFL_SUB_AVG_X(arch, 4, 16, 32, 6)                                       \
188
  CFL_SUB_AVG_X(arch, 8, 4, 16, 5)                                        \
189
  CFL_SUB_AVG_X(arch, 8, 8, 32, 6)                                        \
190
  CFL_SUB_AVG_X(arch, 8, 16, 64, 7)                                       \
191
  CFL_SUB_AVG_X(arch, 8, 32, 128, 8)                                      \
192
  CFL_SUB_AVG_X(arch, 16, 4, 32, 6)                                       \
193
  CFL_SUB_AVG_X(arch, 16, 8, 64, 7)                                       \
194
  CFL_SUB_AVG_X(arch, 16, 16, 128, 8)                                     \
195
  CFL_SUB_AVG_X(arch, 16, 32, 256, 9)                                     \
196
  CFL_SUB_AVG_X(arch, 32, 8, 128, 8)                                      \
197
  CFL_SUB_AVG_X(arch, 32, 16, 256, 9)                                     \
198
  CFL_SUB_AVG_X(arch, 32, 32, 512, 10)                                    \
199
  cfl_subtract_average_fn cfl_get_subtract_average_fn_##arch(             \
200
0
      TX_SIZE tx_size) {                                                  \
201
0
    static const cfl_subtract_average_fn sub_avg[TX_SIZES_ALL] = {        \
202
0
      cfl_subtract_average_4x4_##arch,   /* 4x4 */                        \
203
0
      cfl_subtract_average_8x8_##arch,   /* 8x8 */                        \
204
0
      cfl_subtract_average_16x16_##arch, /* 16x16 */                      \
205
0
      cfl_subtract_average_32x32_##arch, /* 32x32 */                      \
206
0
      NULL,                              /* 64x64 (invalid CFL size) */   \
207
0
      cfl_subtract_average_4x8_##arch,   /* 4x8 */                        \
208
0
      cfl_subtract_average_8x4_##arch,   /* 8x4 */                        \
209
0
      cfl_subtract_average_8x16_##arch,  /* 8x16 */                       \
210
0
      cfl_subtract_average_16x8_##arch,  /* 16x8 */                       \
211
0
      cfl_subtract_average_16x32_##arch, /* 16x32 */                      \
212
0
      cfl_subtract_average_32x16_##arch, /* 32x16 */                      \
213
0
      NULL,                              /* 32x64 (invalid CFL size) */   \
214
0
      NULL,                              /* 64x32 (invalid CFL size) */   \
215
0
      cfl_subtract_average_4x16_##arch,  /* 4x16 */                       \
216
0
      cfl_subtract_average_16x4_##arch,  /* 16x4 */                       \
217
0
      cfl_subtract_average_8x32_##arch,  /* 8x32 */                       \
218
0
      cfl_subtract_average_32x8_##arch,  /* 32x8 */                       \
219
0
      NULL,                              /* 16x64 (invalid CFL size) */   \
220
0
      NULL,                              /* 64x16 (invalid CFL size) */   \
221
0
    };                                                                    \
222
0
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */ \
223
0
    /* index the function pointer array out of bounds. */                 \
224
0
    return sub_avg[tx_size % TX_SIZES_ALL];                               \
225
0
  }
226
227
// Declare and define a size-specific low-bit-depth prediction wrapper that
// forwards to the size-generic cfl_predict_lbd_<arch>() with width and height
// passed as constants.
#define CFL_PREDICT_lbd(arch, width, height)                                   \
228
  void cfl_predict_lbd_##width##x##height##_##arch(                            \
229
      const int16_t *pred_buf_q3, uint8_t *dst, int dst_stride, int alpha_q3); \
230
  void cfl_predict_lbd_##width##x##height##_##arch(                            \
231
      const int16_t *pred_buf_q3, uint8_t *dst, int dst_stride,                \
232
1.25M
      int alpha_q3) {                                                          \
233
1.25M
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
1.25M
                           height);                                            \
235
1.25M
  }
Unexecuted instantiation: cfl_predict_lbd_4x4_c
Unexecuted instantiation: cfl_predict_lbd_4x8_c
Unexecuted instantiation: cfl_predict_lbd_4x16_c
Unexecuted instantiation: cfl_predict_lbd_8x4_c
Unexecuted instantiation: cfl_predict_lbd_8x8_c
Unexecuted instantiation: cfl_predict_lbd_8x16_c
Unexecuted instantiation: cfl_predict_lbd_8x32_c
Unexecuted instantiation: cfl_predict_lbd_16x4_c
Unexecuted instantiation: cfl_predict_lbd_16x8_c
Unexecuted instantiation: cfl_predict_lbd_16x16_c
Unexecuted instantiation: cfl_predict_lbd_16x32_c
Unexecuted instantiation: cfl_predict_lbd_32x8_c
Unexecuted instantiation: cfl_predict_lbd_32x16_c
Unexecuted instantiation: cfl_predict_lbd_32x32_c
cfl_predict_lbd_4x4_ssse3
Line
Count
Source
232
197k
      int alpha_q3) {                                                          \
233
197k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
197k
                           height);                                            \
235
197k
  }
cfl_predict_lbd_4x8_ssse3
Line
Count
Source
232
75.3k
      int alpha_q3) {                                                          \
233
75.3k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
75.3k
                           height);                                            \
235
75.3k
  }
cfl_predict_lbd_4x16_ssse3
Line
Count
Source
232
242k
      int alpha_q3) {                                                          \
233
242k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
242k
                           height);                                            \
235
242k
  }
cfl_predict_lbd_8x4_ssse3
Line
Count
Source
232
118k
      int alpha_q3) {                                                          \
233
118k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
118k
                           height);                                            \
235
118k
  }
cfl_predict_lbd_8x8_ssse3
Line
Count
Source
232
169k
      int alpha_q3) {                                                          \
233
169k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
169k
                           height);                                            \
235
169k
  }
cfl_predict_lbd_8x16_ssse3
Line
Count
Source
232
46.7k
      int alpha_q3) {                                                          \
233
46.7k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
46.7k
                           height);                                            \
235
46.7k
  }
cfl_predict_lbd_8x32_ssse3
Line
Count
Source
232
30.4k
      int alpha_q3) {                                                          \
233
30.4k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
30.4k
                           height);                                            \
235
30.4k
  }
cfl_predict_lbd_16x4_ssse3
Line
Count
Source
232
120k
      int alpha_q3) {                                                          \
233
120k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
120k
                           height);                                            \
235
120k
  }
cfl_predict_lbd_16x8_ssse3
Line
Count
Source
232
64.4k
      int alpha_q3) {                                                          \
233
64.4k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
64.4k
                           height);                                            \
235
64.4k
  }
cfl_predict_lbd_16x16_ssse3
Line
Count
Source
232
94.4k
      int alpha_q3) {                                                          \
233
94.4k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
94.4k
                           height);                                            \
235
94.4k
  }
cfl_predict_lbd_16x32_ssse3
Line
Count
Source
232
26.3k
      int alpha_q3) {                                                          \
233
26.3k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
26.3k
                           height);                                            \
235
26.3k
  }
Unexecuted instantiation: cfl_predict_lbd_32x8_ssse3
Unexecuted instantiation: cfl_predict_lbd_32x16_ssse3
Unexecuted instantiation: cfl_predict_lbd_32x32_ssse3
cfl_predict_lbd_32x8_avx2
Line
Count
Source
232
23.5k
      int alpha_q3) {                                                          \
233
23.5k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
23.5k
                           height);                                            \
235
23.5k
  }
cfl_predict_lbd_32x16_avx2
Line
Count
Source
232
12.2k
      int alpha_q3) {                                                          \
233
12.2k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
12.2k
                           height);                                            \
235
12.2k
  }
cfl_predict_lbd_32x32_avx2
Line
Count
Source
232
29.9k
      int alpha_q3) {                                                          \
233
29.9k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
29.9k
                           height);                                            \
235
29.9k
  }
236
237
#if CONFIG_AV1_HIGHBITDEPTH
238
#define CFL_PREDICT_hbd(arch, width, height)                                   \
239
  void cfl_predict_hbd_##width##x##height##_##arch(                            \
240
      const int16_t *pred_buf_q3, uint16_t *dst, int dst_stride, int alpha_q3, \
241
      int bd);                                                                 \
242
  void cfl_predict_hbd_##width##x##height##_##arch(                            \
243
      const int16_t *pred_buf_q3, uint16_t *dst, int dst_stride, int alpha_q3, \
244
1.28M
      int bd) {                                                                \
245
1.28M
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
1.28M
                           height);                                            \
247
1.28M
  }
Unexecuted instantiation: cfl_predict_hbd_4x4_c
Unexecuted instantiation: cfl_predict_hbd_4x8_c
Unexecuted instantiation: cfl_predict_hbd_4x16_c
Unexecuted instantiation: cfl_predict_hbd_8x4_c
Unexecuted instantiation: cfl_predict_hbd_8x8_c
Unexecuted instantiation: cfl_predict_hbd_8x16_c
Unexecuted instantiation: cfl_predict_hbd_8x32_c
Unexecuted instantiation: cfl_predict_hbd_16x4_c
Unexecuted instantiation: cfl_predict_hbd_16x8_c
Unexecuted instantiation: cfl_predict_hbd_16x16_c
Unexecuted instantiation: cfl_predict_hbd_16x32_c
Unexecuted instantiation: cfl_predict_hbd_32x8_c
Unexecuted instantiation: cfl_predict_hbd_32x16_c
Unexecuted instantiation: cfl_predict_hbd_32x32_c
cfl_predict_hbd_4x4_ssse3
Line
Count
Source
244
245k
      int bd) {                                                                \
245
245k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
245k
                           height);                                            \
247
245k
  }
cfl_predict_hbd_4x8_ssse3
Line
Count
Source
244
80.8k
      int bd) {                                                                \
245
80.8k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
80.8k
                           height);                                            \
247
80.8k
  }
cfl_predict_hbd_4x16_ssse3
Line
Count
Source
244
70.2k
      int bd) {                                                                \
245
70.2k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
70.2k
                           height);                                            \
247
70.2k
  }
cfl_predict_hbd_8x4_ssse3
Line
Count
Source
244
143k
      int bd) {                                                                \
245
143k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
143k
                           height);                                            \
247
143k
  }
cfl_predict_hbd_8x8_ssse3
Line
Count
Source
244
210k
      int bd) {                                                                \
245
210k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
210k
                           height);                                            \
247
210k
  }
cfl_predict_hbd_8x16_ssse3
Line
Count
Source
244
75.5k
      int bd) {                                                                \
245
75.5k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
75.5k
                           height);                                            \
247
75.5k
  }
cfl_predict_hbd_8x32_ssse3
Line
Count
Source
244
36.1k
      int bd) {                                                                \
245
36.1k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
36.1k
                           height);                                            \
247
36.1k
  }
Unexecuted instantiation: cfl_predict_hbd_16x4_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x8_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x16_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x32_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x8_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x16_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x32_ssse3
cfl_predict_hbd_16x4_avx2
Line
Count
Source
244
103k
      int bd) {                                                                \
245
103k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
103k
                           height);                                            \
247
103k
  }
cfl_predict_hbd_16x8_avx2
Line
Count
Source
244
96.4k
      int bd) {                                                                \
245
96.4k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
96.4k
                           height);                                            \
247
96.4k
  }
cfl_predict_hbd_16x16_avx2
Line
Count
Source
244
114k
      int bd) {                                                                \
245
114k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
114k
                           height);                                            \
247
114k
  }
cfl_predict_hbd_16x32_avx2
Line
Count
Source
244
16.6k
      int bd) {                                                                \
245
16.6k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
16.6k
                           height);                                            \
247
16.6k
  }
cfl_predict_hbd_32x8_avx2
Line
Count
Source
244
35.4k
      int bd) {                                                                \
245
35.4k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
35.4k
                           height);                                            \
247
35.4k
  }
cfl_predict_hbd_32x16_avx2
Line
Count
Source
244
25.3k
      int bd) {                                                                \
245
25.3k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
25.3k
                           height);                                            \
247
25.3k
  }
cfl_predict_hbd_32x32_avx2
Line
Count
Source
244
33.9k
      int bd) {                                                                \
245
33.9k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
33.9k
                           height);                                            \
247
33.9k
  }
248
#endif
249
250
// This wrapper exists because clang format does not like calling macros with
251
// lowercase letters.
252
#define CFL_PREDICT_X(arch, width, height, bd) \
253
  CFL_PREDICT_##bd(arch, width, height)
254
255
#define CFL_PREDICT_FN(arch, bd)                                            \
256
  CFL_PREDICT_X(arch, 4, 4, bd)                                             \
257
  CFL_PREDICT_X(arch, 4, 8, bd)                                             \
258
  CFL_PREDICT_X(arch, 4, 16, bd)                                            \
259
  CFL_PREDICT_X(arch, 8, 4, bd)                                             \
260
  CFL_PREDICT_X(arch, 8, 8, bd)                                             \
261
  CFL_PREDICT_X(arch, 8, 16, bd)                                            \
262
  CFL_PREDICT_X(arch, 8, 32, bd)                                            \
263
  CFL_PREDICT_X(arch, 16, 4, bd)                                            \
264
  CFL_PREDICT_X(arch, 16, 8, bd)                                            \
265
  CFL_PREDICT_X(arch, 16, 16, bd)                                           \
266
  CFL_PREDICT_X(arch, 16, 32, bd)                                           \
267
  CFL_PREDICT_X(arch, 32, 8, bd)                                            \
268
  CFL_PREDICT_X(arch, 32, 16, bd)                                           \
269
  CFL_PREDICT_X(arch, 32, 32, bd)                                           \
270
0
  cfl_predict_##bd##_fn cfl_get_predict_##bd##_fn_##arch(TX_SIZE tx_size) { \
271
0
    static const cfl_predict_##bd##_fn pred[TX_SIZES_ALL] = {               \
272
0
      cfl_predict_##bd##_4x4_##arch,   /* 4x4 */                            \
273
0
      cfl_predict_##bd##_8x8_##arch,   /* 8x8 */                            \
274
0
      cfl_predict_##bd##_16x16_##arch, /* 16x16 */                          \
275
0
      cfl_predict_##bd##_32x32_##arch, /* 32x32 */                          \
276
0
      NULL,                            /* 64x64 (invalid CFL size) */       \
277
0
      cfl_predict_##bd##_4x8_##arch,   /* 4x8 */                            \
278
0
      cfl_predict_##bd##_8x4_##arch,   /* 8x4 */                            \
279
0
      cfl_predict_##bd##_8x16_##arch,  /* 8x16 */                           \
280
0
      cfl_predict_##bd##_16x8_##arch,  /* 16x8 */                           \
281
0
      cfl_predict_##bd##_16x32_##arch, /* 16x32 */                          \
282
0
      cfl_predict_##bd##_32x16_##arch, /* 32x16 */                          \
283
0
      NULL,                            /* 32x64 (invalid CFL size) */       \
284
0
      NULL,                            /* 64x32 (invalid CFL size) */       \
285
0
      cfl_predict_##bd##_4x16_##arch,  /* 4x16  */                          \
286
0
      cfl_predict_##bd##_16x4_##arch,  /* 16x4  */                          \
287
0
      cfl_predict_##bd##_8x32_##arch,  /* 8x32  */                          \
288
0
      cfl_predict_##bd##_32x8_##arch,  /* 32x8  */                          \
289
0
      NULL,                            /* 16x64 (invalid CFL size) */       \
290
0
      NULL,                            /* 64x16 (invalid CFL size) */       \
291
0
    };                                                                      \
292
0
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */   \
293
0
    /* index the function pointer array out of bounds. */                   \
294
0
    return pred[tx_size % TX_SIZES_ALL];                                    \
295
0
  }
296
297
#endif  // AOM_AV1_COMMON_CFL_H_