Coverage Report

Created: 2026-03-08 06:51

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/aom/av1/common/cfl.h
Line
Count
Source
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved.
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#ifndef AOM_AV1_COMMON_CFL_H_
13
#define AOM_AV1_COMMON_CFL_H_
14
15
#include "av1/common/av1_common_int.h"
16
#include "av1/common/blockd.h"
17
18
// Can we use CfL for the current block?
19
11.6M
static inline CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
11.6M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
11.6M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
11.6M
  assert(bsize < BLOCK_SIZES_ALL);
23
11.6M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
48.9k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
48.9k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
48.9k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
48.9k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
48.9k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
11.5M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
10.7M
                            block_size_high[bsize] <= 32);
34
11.6M
}
Unexecuted instantiation: decodeframe.c:is_cfl_allowed
decodemv.c:is_cfl_allowed
Line
Count
Source
19
8.47M
static inline CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
8.47M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
8.47M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
8.47M
  assert(bsize < BLOCK_SIZES_ALL);
23
8.47M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
48.4k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
48.4k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
48.4k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
48.4k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
48.4k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
8.43M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
7.61M
                            block_size_high[bsize] <= 32);
34
8.47M
}
cfl.c:is_cfl_allowed
Line
Count
Source
19
3.12M
static inline CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
3.12M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
3.12M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
3.12M
  assert(bsize < BLOCK_SIZES_ALL);
23
3.12M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
586
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
586
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
586
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
586
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
586
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
3.12M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
3.12M
                            block_size_high[bsize] <= 32);
34
3.12M
}
Unexecuted instantiation: reconintra.c:is_cfl_allowed
Unexecuted instantiation: cfl_sse2.c:is_cfl_allowed
Unexecuted instantiation: cfl_ssse3.c:is_cfl_allowed
Unexecuted instantiation: cfl_avx2.c:is_cfl_allowed
35
36
// Do we need to save the luma pixels from the current block,
37
// for a possible future CfL prediction?
38
static inline CFL_ALLOWED_TYPE store_cfl_required(const AV1_COMMON *cm,
39
47.2M
                                                  const MACROBLOCKD *xd) {
40
47.2M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
47.2M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
45.1M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
2.25M
    return CFL_ALLOWED;
51
2.25M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
42.9M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
36.6M
                            mbmi->uv_mode == UV_CFL_PRED);
57
45.1M
}
decodeframe.c:store_cfl_required
Line
Count
Source
39
33.4M
                                                  const MACROBLOCKD *xd) {
40
33.4M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
33.4M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
32.2M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
1.10M
    return CFL_ALLOWED;
51
1.10M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
31.1M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
28.1M
                            mbmi->uv_mode == UV_CFL_PRED);
57
32.2M
}
decodemv.c:store_cfl_required
Line
Count
Source
39
13.7M
                                                  const MACROBLOCKD *xd) {
40
13.7M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
13.7M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
12.9M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
1.14M
    return CFL_ALLOWED;
51
1.14M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
11.7M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
8.47M
                            mbmi->uv_mode == UV_CFL_PRED);
57
12.9M
}
Unexecuted instantiation: cfl.c:store_cfl_required
Unexecuted instantiation: reconintra.c:store_cfl_required
Unexecuted instantiation: cfl_sse2.c:store_cfl_required
Unexecuted instantiation: cfl_ssse3.c:store_cfl_required
Unexecuted instantiation: cfl_avx2.c:store_cfl_required
58
59
0
static inline int get_scaled_luma_q0(int alpha_q3, int16_t pred_buf_q3) {
60
0
  int scaled_luma_q6 = alpha_q3 * pred_buf_q3;
61
0
  return ROUND_POWER_OF_TWO_SIGNED(scaled_luma_q6, 6);
62
0
}
Unexecuted instantiation: decodeframe.c:get_scaled_luma_q0
Unexecuted instantiation: decodemv.c:get_scaled_luma_q0
Unexecuted instantiation: cfl.c:get_scaled_luma_q0
Unexecuted instantiation: reconintra.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_sse2.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_ssse3.c:get_scaled_luma_q0
Unexecuted instantiation: cfl_avx2.c:get_scaled_luma_q0
63
64
3.12M
static inline CFL_PRED_TYPE get_cfl_pred_type(int plane) {
65
3.12M
  assert(plane > 0);
66
3.12M
  return (CFL_PRED_TYPE)(plane - 1);
67
3.12M
}
Unexecuted instantiation: decodeframe.c:get_cfl_pred_type
Unexecuted instantiation: decodemv.c:get_cfl_pred_type
Unexecuted instantiation: cfl.c:get_cfl_pred_type
reconintra.c:get_cfl_pred_type
Line
Count
Source
64
3.12M
static inline CFL_PRED_TYPE get_cfl_pred_type(int plane) {
65
3.12M
  assert(plane > 0);
66
3.12M
  return (CFL_PRED_TYPE)(plane - 1);
67
3.12M
}
Unexecuted instantiation: cfl_sse2.c:get_cfl_pred_type
Unexecuted instantiation: cfl_ssse3.c:get_cfl_pred_type
Unexecuted instantiation: cfl_avx2.c:get_cfl_pred_type
68
69
268k
static inline void clear_cfl_dc_pred_cache_flags(CFL_CTX *cfl) {
70
268k
  cfl->use_dc_pred_cache = false;
71
268k
  cfl->dc_pred_is_cached[CFL_PRED_U] = false;
72
268k
  cfl->dc_pred_is_cached[CFL_PRED_V] = false;
73
268k
}
Unexecuted instantiation: decodeframe.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: decodemv.c:clear_cfl_dc_pred_cache_flags
cfl.c:clear_cfl_dc_pred_cache_flags
Line
Count
Source
69
268k
static inline void clear_cfl_dc_pred_cache_flags(CFL_CTX *cfl) {
70
268k
  cfl->use_dc_pred_cache = false;
71
268k
  cfl->dc_pred_is_cached[CFL_PRED_U] = false;
72
  cfl->dc_pred_is_cached[CFL_PRED_V] = false;
73
268k
}
Unexecuted instantiation: reconintra.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_sse2.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_ssse3.c:clear_cfl_dc_pred_cache_flags
Unexecuted instantiation: cfl_avx2.c:clear_cfl_dc_pred_cache_flags
74
75
void av1_cfl_predict_block(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
76
                           TX_SIZE tx_size, int plane);
77
78
void cfl_store_block(MACROBLOCKD *const xd, BLOCK_SIZE bsize, TX_SIZE tx_size);
79
80
void cfl_store_tx(MACROBLOCKD *const xd, int row, int col, TX_SIZE tx_size,
81
                  BLOCK_SIZE bsize);
82
83
void cfl_store_dc_pred(MACROBLOCKD *const xd, const uint8_t *input,
84
                       CFL_PRED_TYPE pred_plane, int width);
85
86
void cfl_load_dc_pred(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
87
                      TX_SIZE tx_size, CFL_PRED_TYPE pred_plane);
88
89
// Allows the CFL_SUBSAMPLE function to switch types depending on the bitdepth.
90
#define CFL_lbd_TYPE uint8_t *cfl_type
91
#define CFL_hbd_TYPE uint16_t *cfl_type
92
93
// Declare a size-specific wrapper for the size-generic function. The compiler
94
// will inline the size generic function in here, the advantage is that the size
95
// will be constant allowing for loop unrolling and other constant propagated
96
// goodness.
97
#define CFL_SUBSAMPLE(arch, sub, bd, width, height)                       \
98
  void cfl_subsample_##bd##_##sub##_##width##x##height##_##arch(          \
99
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3);      \
100
  void cfl_subsample_##bd##_##sub##_##width##x##height##_##arch(          \
101
2.74M
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
2.74M
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
2.74M
                                               output_q3, width, height); \
104
2.74M
  }
Unexecuted instantiation: cfl_subsample_lbd_420_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_420_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_420_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_420_32x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_420_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_420_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_420_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x8_c
cfl_subsample_lbd_420_4x4_ssse3
Line
Count
Source
101
157k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
157k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
157k
                                               output_q3, width, height); \
104
157k
  }
cfl_subsample_lbd_420_8x8_ssse3
Line
Count
Source
101
61.9k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
61.9k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
61.9k
                                               output_q3, width, height); \
104
61.9k
  }
cfl_subsample_lbd_420_16x16_ssse3
Line
Count
Source
101
37.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
37.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
37.7k
                                               output_q3, width, height); \
104
37.7k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x32_ssse3
cfl_subsample_lbd_420_4x8_ssse3
Line
Count
Source
101
88.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
88.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
88.4k
                                               output_q3, width, height); \
104
88.4k
  }
cfl_subsample_lbd_420_8x4_ssse3
Line
Count
Source
101
100k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
100k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
100k
                                               output_q3, width, height); \
104
100k
  }
cfl_subsample_lbd_420_8x16_ssse3
Line
Count
Source
101
19.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
19.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
19.6k
                                               output_q3, width, height); \
104
19.6k
  }
cfl_subsample_lbd_420_16x8_ssse3
Line
Count
Source
101
30.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
30.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
30.1k
                                               output_q3, width, height); \
104
30.1k
  }
cfl_subsample_lbd_420_16x32_ssse3
Line
Count
Source
101
6.41k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
6.41k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
6.41k
                                               output_q3, width, height); \
104
6.41k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x16_ssse3
cfl_subsample_lbd_420_4x16_ssse3
Line
Count
Source
101
111k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
111k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
111k
                                               output_q3, width, height); \
104
111k
  }
cfl_subsample_lbd_420_16x4_ssse3
Line
Count
Source
101
146k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
146k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
146k
                                               output_q3, width, height); \
104
146k
  }
cfl_subsample_lbd_420_8x32_ssse3
Line
Count
Source
101
9.20k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
9.20k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
9.20k
                                               output_q3, width, height); \
104
9.20k
  }
Unexecuted instantiation: cfl_subsample_lbd_420_32x8_ssse3
cfl_subsample_lbd_422_4x4_ssse3
Line
Count
Source
101
198
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
198
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
198
                                               output_q3, width, height); \
104
198
  }
cfl_subsample_lbd_422_8x8_ssse3
Line
Count
Source
101
2.80k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
2.80k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
2.80k
                                               output_q3, width, height); \
104
2.80k
  }
cfl_subsample_lbd_422_16x16_ssse3
Line
Count
Source
101
287
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
287
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
287
                                               output_q3, width, height); \
104
287
  }
Unexecuted instantiation: cfl_subsample_lbd_422_32x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_4x8_ssse3
cfl_subsample_lbd_422_8x4_ssse3
Line
Count
Source
101
67
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
67
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
67
                                               output_q3, width, height); \
104
67
  }
Unexecuted instantiation: cfl_subsample_lbd_422_8x16_ssse3
cfl_subsample_lbd_422_16x8_ssse3
Line
Count
Source
101
333
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
333
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
333
                                               output_q3, width, height); \
104
333
  }
Unexecuted instantiation: cfl_subsample_lbd_422_16x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_32x16_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_4x16_ssse3
cfl_subsample_lbd_422_16x4_ssse3
Line
Count
Source
101
487
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
487
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
487
                                               output_q3, width, height); \
104
487
  }
Unexecuted instantiation: cfl_subsample_lbd_422_8x32_ssse3
Unexecuted instantiation: cfl_subsample_lbd_422_32x8_ssse3
cfl_subsample_lbd_444_4x4_ssse3
Line
Count
Source
101
55.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
55.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
55.5k
                                               output_q3, width, height); \
104
55.5k
  }
cfl_subsample_lbd_444_8x8_ssse3
Line
Count
Source
101
75.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
75.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
75.1k
                                               output_q3, width, height); \
104
75.1k
  }
cfl_subsample_lbd_444_16x16_ssse3
Line
Count
Source
101
41.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
41.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
41.3k
                                               output_q3, width, height); \
104
41.3k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x32_ssse3
cfl_subsample_lbd_444_4x8_ssse3
Line
Count
Source
101
15.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
15.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
15.4k
                                               output_q3, width, height); \
104
15.4k
  }
cfl_subsample_lbd_444_8x4_ssse3
Line
Count
Source
101
26.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
26.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
26.3k
                                               output_q3, width, height); \
104
26.3k
  }
cfl_subsample_lbd_444_8x16_ssse3
Line
Count
Source
101
25.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
25.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
25.2k
                                               output_q3, width, height); \
104
25.2k
  }
cfl_subsample_lbd_444_16x8_ssse3
Line
Count
Source
101
38.9k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
38.9k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
38.9k
                                               output_q3, width, height); \
104
38.9k
  }
cfl_subsample_lbd_444_16x32_ssse3
Line
Count
Source
101
21.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
21.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
21.1k
                                               output_q3, width, height); \
104
21.1k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x16_ssse3
cfl_subsample_lbd_444_4x16_ssse3
Line
Count
Source
101
248k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
248k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
248k
                                               output_q3, width, height); \
104
248k
  }
cfl_subsample_lbd_444_16x4_ssse3
Line
Count
Source
101
57.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
57.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
57.3k
                                               output_q3, width, height); \
104
57.3k
  }
cfl_subsample_lbd_444_8x32_ssse3
Line
Count
Source
101
19.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
19.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
19.7k
                                               output_q3, width, height); \
104
19.7k
  }
Unexecuted instantiation: cfl_subsample_lbd_444_32x8_ssse3
cfl_subsample_hbd_420_4x4_ssse3
Line
Count
Source
101
132k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
132k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
132k
                                               output_q3, width, height); \
104
132k
  }
cfl_subsample_hbd_420_8x8_ssse3
Line
Count
Source
101
55.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
55.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
55.1k
                                               output_q3, width, height); \
104
55.1k
  }
cfl_subsample_hbd_420_16x16_ssse3
Line
Count
Source
101
25.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
25.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
25.4k
                                               output_q3, width, height); \
104
25.4k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x32_ssse3
cfl_subsample_hbd_420_4x8_ssse3
Line
Count
Source
101
85.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
85.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
85.5k
                                               output_q3, width, height); \
104
85.5k
  }
cfl_subsample_hbd_420_8x4_ssse3
Line
Count
Source
101
117k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
117k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
117k
                                               output_q3, width, height); \
104
117k
  }
cfl_subsample_hbd_420_8x16_ssse3
Line
Count
Source
101
10.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
10.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
10.2k
                                               output_q3, width, height); \
104
10.2k
  }
cfl_subsample_hbd_420_16x8_ssse3
Line
Count
Source
101
23.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
23.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
23.6k
                                               output_q3, width, height); \
104
23.6k
  }
cfl_subsample_hbd_420_16x32_ssse3
Line
Count
Source
101
4.05k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
4.05k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
4.05k
                                               output_q3, width, height); \
104
4.05k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x16_ssse3
cfl_subsample_hbd_420_4x16_ssse3
Line
Count
Source
101
105k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
105k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
105k
                                               output_q3, width, height); \
104
105k
  }
cfl_subsample_hbd_420_16x4_ssse3
Line
Count
Source
101
159k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
159k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
159k
                                               output_q3, width, height); \
104
159k
  }
cfl_subsample_hbd_420_8x32_ssse3
Line
Count
Source
101
7.06k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
7.06k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
7.06k
                                               output_q3, width, height); \
104
7.06k
  }
Unexecuted instantiation: cfl_subsample_hbd_420_32x8_ssse3
cfl_subsample_hbd_422_4x4_ssse3
Line
Count
Source
101
1.12k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
1.12k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
1.12k
                                               output_q3, width, height); \
104
1.12k
  }
cfl_subsample_hbd_422_8x8_ssse3
Line
Count
Source
101
133
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
133
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
133
                                               output_q3, width, height); \
104
133
  }
cfl_subsample_hbd_422_16x16_ssse3
Line
Count
Source
101
27
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
27
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
27
                                               output_q3, width, height); \
104
27
  }
Unexecuted instantiation: cfl_subsample_hbd_422_32x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_4x8_ssse3
cfl_subsample_hbd_422_8x4_ssse3
Line
Count
Source
101
259
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
259
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
259
                                               output_q3, width, height); \
104
259
  }
Unexecuted instantiation: cfl_subsample_hbd_422_8x16_ssse3
cfl_subsample_hbd_422_16x8_ssse3
Line
Count
Source
101
80
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
80
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
80
                                               output_q3, width, height); \
104
80
  }
Unexecuted instantiation: cfl_subsample_hbd_422_16x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_32x16_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_4x16_ssse3
cfl_subsample_hbd_422_16x4_ssse3
Line
Count
Source
101
42
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
42
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
42
                                               output_q3, width, height); \
104
42
  }
Unexecuted instantiation: cfl_subsample_hbd_422_8x32_ssse3
Unexecuted instantiation: cfl_subsample_hbd_422_32x8_ssse3
cfl_subsample_hbd_444_4x4_ssse3
Line
Count
Source
101
85.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
85.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
85.2k
                                               output_q3, width, height); \
104
85.2k
  }
cfl_subsample_hbd_444_8x8_ssse3
Line
Count
Source
101
94.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
94.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
94.6k
                                               output_q3, width, height); \
104
94.6k
  }
cfl_subsample_hbd_444_16x16_ssse3
Line
Count
Source
101
45.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
45.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
45.3k
                                               output_q3, width, height); \
104
45.3k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x32_ssse3
cfl_subsample_hbd_444_4x8_ssse3
Line
Count
Source
101
23.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
23.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
23.5k
                                               output_q3, width, height); \
104
23.5k
  }
cfl_subsample_hbd_444_8x4_ssse3
Line
Count
Source
101
40.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
40.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
40.8k
                                               output_q3, width, height); \
104
40.8k
  }
cfl_subsample_hbd_444_8x16_ssse3
Line
Count
Source
101
34.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
34.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
34.4k
                                               output_q3, width, height); \
104
34.4k
  }
cfl_subsample_hbd_444_16x8_ssse3
Line
Count
Source
101
46.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
46.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
46.6k
                                               output_q3, width, height); \
104
46.6k
  }
cfl_subsample_hbd_444_16x32_ssse3
Line
Count
Source
101
8.83k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
8.83k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
8.83k
                                               output_q3, width, height); \
104
8.83k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x16_ssse3
cfl_subsample_hbd_444_4x16_ssse3
Line
Count
Source
101
24.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
24.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
24.6k
                                               output_q3, width, height); \
104
24.6k
  }
cfl_subsample_hbd_444_16x4_ssse3
Line
Count
Source
101
40.9k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
40.9k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
40.9k
                                               output_q3, width, height); \
104
40.9k
  }
cfl_subsample_hbd_444_8x32_ssse3
Line
Count
Source
101
14.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
14.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
14.6k
                                               output_q3, width, height); \
104
14.6k
  }
Unexecuted instantiation: cfl_subsample_hbd_444_32x8_ssse3
cfl_subsample_lbd_420_32x32_avx2
Line
Count
Source
101
20.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
20.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
20.0k
                                               output_q3, width, height); \
104
20.0k
  }
cfl_subsample_lbd_420_32x16_avx2
Line
Count
Source
101
6.70k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
6.70k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
6.70k
                                               output_q3, width, height); \
104
6.70k
  }
cfl_subsample_lbd_420_32x8_avx2
Line
Count
Source
101
11.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
11.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
11.0k
                                               output_q3, width, height); \
104
11.0k
  }
cfl_subsample_lbd_422_32x32_avx2
Line
Count
Source
101
386
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
386
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
386
                                               output_q3, width, height); \
104
386
  }
cfl_subsample_lbd_422_32x16_avx2
Line
Count
Source
101
175
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
175
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
175
                                               output_q3, width, height); \
104
175
  }
cfl_subsample_lbd_422_32x8_avx2
Line
Count
Source
101
472
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
472
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
472
                                               output_q3, width, height); \
104
472
  }
cfl_subsample_lbd_444_32x32_avx2
Line
Count
Source
101
21.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
21.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
21.3k
                                               output_q3, width, height); \
104
21.3k
  }
cfl_subsample_lbd_444_32x16_avx2
Line
Count
Source
101
9.36k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
9.36k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
9.36k
                                               output_q3, width, height); \
104
9.36k
  }
cfl_subsample_lbd_444_32x8_avx2
Line
Count
Source
101
15.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
15.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
15.4k
                                               output_q3, width, height); \
104
15.4k
  }
cfl_subsample_hbd_420_32x32_avx2
Line
Count
Source
101
13.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
13.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
13.7k
                                               output_q3, width, height); \
104
13.7k
  }
cfl_subsample_hbd_420_32x16_avx2
Line
Count
Source
101
5.08k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
5.08k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
5.08k
                                               output_q3, width, height); \
104
5.08k
  }
cfl_subsample_hbd_420_32x8_avx2
Line
Count
Source
101
7.85k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
7.85k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
7.85k
                                               output_q3, width, height); \
104
7.85k
  }
cfl_subsample_hbd_422_32x32_avx2
Line
Count
Source
101
11
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
11
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
11
                                               output_q3, width, height); \
104
11
  }
cfl_subsample_hbd_422_32x16_avx2
Line
Count
Source
101
54
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
54
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
54
                                               output_q3, width, height); \
104
54
  }
cfl_subsample_hbd_422_32x8_avx2
Line
Count
Source
101
45
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
45
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
45
                                               output_q3, width, height); \
104
45
  }
cfl_subsample_hbd_444_32x32_avx2
Line
Count
Source
101
19.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
19.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
19.4k
                                               output_q3, width, height); \
104
19.4k
  }
cfl_subsample_hbd_444_32x16_avx2
Line
Count
Source
101
12.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
12.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
12.6k
                                               output_q3, width, height); \
104
12.6k
  }
cfl_subsample_hbd_444_32x8_avx2
Line
Count
Source
101
18.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
102
18.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
103
18.3k
                                               output_q3, width, height); \
104
18.3k
  }
105
106
// Declare size-specific wrappers for all valid CfL sizes.
107
#define CFL_SUBSAMPLE_FUNCTIONS(arch, sub, bd)                            \
108
  CFL_SUBSAMPLE(arch, sub, bd, 4, 4)                                      \
109
  CFL_SUBSAMPLE(arch, sub, bd, 8, 8)                                      \
110
  CFL_SUBSAMPLE(arch, sub, bd, 16, 16)                                    \
111
  CFL_SUBSAMPLE(arch, sub, bd, 32, 32)                                    \
112
  CFL_SUBSAMPLE(arch, sub, bd, 4, 8)                                      \
113
  CFL_SUBSAMPLE(arch, sub, bd, 8, 4)                                      \
114
  CFL_SUBSAMPLE(arch, sub, bd, 8, 16)                                     \
115
  CFL_SUBSAMPLE(arch, sub, bd, 16, 8)                                     \
116
  CFL_SUBSAMPLE(arch, sub, bd, 16, 32)                                    \
117
  CFL_SUBSAMPLE(arch, sub, bd, 32, 16)                                    \
118
  CFL_SUBSAMPLE(arch, sub, bd, 4, 16)                                     \
119
  CFL_SUBSAMPLE(arch, sub, bd, 16, 4)                                     \
120
  CFL_SUBSAMPLE(arch, sub, bd, 8, 32)                                     \
121
  CFL_SUBSAMPLE(arch, sub, bd, 32, 8)                                     \
122
  cfl_subsample_##bd##_fn cfl_get_luma_subsampling_##sub##_##bd##_##arch( \
123
0
      TX_SIZE tx_size) {                                                  \
124
0
    CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
125
0
    return subfn_##sub[tx_size];                                          \
126
0
  }
127
128
// Declare an architecture-specific array of function pointers for size-specific
129
// wrappers.
130
#define CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
131
0
  static const cfl_subsample_##bd##_fn subfn_##sub[TX_SIZES_ALL] = {          \
132
0
    cfl_subsample_##bd##_##sub##_4x4_##arch,   /* 4x4 */                      \
133
0
    cfl_subsample_##bd##_##sub##_8x8_##arch,   /* 8x8 */                      \
134
0
    cfl_subsample_##bd##_##sub##_16x16_##arch, /* 16x16 */                    \
135
0
    cfl_subsample_##bd##_##sub##_32x32_##arch, /* 32x32 */                    \
136
0
    NULL,                                      /* 64x64 (invalid CFL size) */ \
137
0
    cfl_subsample_##bd##_##sub##_4x8_##arch,   /* 4x8 */                      \
138
0
    cfl_subsample_##bd##_##sub##_8x4_##arch,   /* 8x4 */                      \
139
0
    cfl_subsample_##bd##_##sub##_8x16_##arch,  /* 8x16 */                     \
140
0
    cfl_subsample_##bd##_##sub##_16x8_##arch,  /* 16x8 */                     \
141
0
    cfl_subsample_##bd##_##sub##_16x32_##arch, /* 16x32 */                    \
142
0
    cfl_subsample_##bd##_##sub##_32x16_##arch, /* 32x16 */                    \
143
0
    NULL,                                      /* 32x64 (invalid CFL size) */ \
144
0
    NULL,                                      /* 64x32 (invalid CFL size) */ \
145
0
    cfl_subsample_##bd##_##sub##_4x16_##arch,  /* 4x16  */                    \
146
0
    cfl_subsample_##bd##_##sub##_16x4_##arch,  /* 16x4  */                    \
147
0
    cfl_subsample_##bd##_##sub##_8x32_##arch,  /* 8x32  */                    \
148
0
    cfl_subsample_##bd##_##sub##_32x8_##arch,  /* 32x8  */                    \
149
0
    NULL,                                      /* 16x64 (invalid CFL size) */ \
150
0
    NULL,                                      /* 64x16 (invalid CFL size) */ \
151
0
  };
152
153
// The RTCD script does not support passing in an array, so we wrap it in this
154
// function.
155
#if CONFIG_AV1_HIGHBITDEPTH
156
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
157
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
158
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
159
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd) \
160
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, hbd) \
161
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, hbd) \
162
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, hbd)
163
#else
164
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
165
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
166
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
167
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd)
168
#endif
169
170
// Declare a size-specific wrapper for the size-generic function. The compiler
171
// will inline the size-generic function here; the advantage is that the size
172
// is then a compile-time constant, allowing loop unrolling and other
173
// constant-propagation optimizations.
174
#define CFL_SUB_AVG_X(arch, width, height, round_offset, num_pel_log2)       \
175
  void cfl_subtract_average_##width##x##height##_##arch(const uint16_t *src, \
176
                                                        int16_t *dst);       \
177
  void cfl_subtract_average_##width##x##height##_##arch(const uint16_t *src, \
178
1.56M
                                                        int16_t *dst) {      \
179
1.56M
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
1.56M
                            num_pel_log2);                                   \
181
1.56M
  }
Unexecuted instantiation: cfl_subtract_average_4x4_c
Unexecuted instantiation: cfl_subtract_average_4x8_c
Unexecuted instantiation: cfl_subtract_average_4x16_c
Unexecuted instantiation: cfl_subtract_average_8x4_c
Unexecuted instantiation: cfl_subtract_average_8x8_c
Unexecuted instantiation: cfl_subtract_average_8x16_c
Unexecuted instantiation: cfl_subtract_average_8x32_c
Unexecuted instantiation: cfl_subtract_average_16x4_c
Unexecuted instantiation: cfl_subtract_average_16x8_c
Unexecuted instantiation: cfl_subtract_average_16x16_c
Unexecuted instantiation: cfl_subtract_average_16x32_c
Unexecuted instantiation: cfl_subtract_average_32x8_c
Unexecuted instantiation: cfl_subtract_average_32x16_c
Unexecuted instantiation: cfl_subtract_average_32x32_c
cfl_subtract_average_4x4_sse2
Line
Count
Source
178
239k
                                                        int16_t *dst) {      \
179
239k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
239k
                            num_pel_log2);                                   \
181
239k
  }
cfl_subtract_average_4x8_sse2
Line
Count
Source
178
89.1k
                                                        int16_t *dst) {      \
179
89.1k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
89.1k
                            num_pel_log2);                                   \
181
89.1k
  }
cfl_subtract_average_4x16_sse2
Line
Count
Source
178
292k
                                                        int16_t *dst) {      \
179
292k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
292k
                            num_pel_log2);                                   \
181
292k
  }
cfl_subtract_average_8x4_sse2
Line
Count
Source
178
146k
                                                        int16_t *dst) {      \
179
146k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
146k
                            num_pel_log2);                                   \
181
146k
  }
cfl_subtract_average_8x8_sse2
Line
Count
Source
178
215k
                                                        int16_t *dst) {      \
179
215k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
215k
                            num_pel_log2);                                   \
181
215k
  }
cfl_subtract_average_8x16_sse2
Line
Count
Source
178
71.5k
                                                        int16_t *dst) {      \
179
71.5k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
71.5k
                            num_pel_log2);                                   \
181
71.5k
  }
cfl_subtract_average_8x32_sse2
Line
Count
Source
178
35.4k
                                                        int16_t *dst) {      \
179
35.4k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
35.4k
                            num_pel_log2);                                   \
181
35.4k
  }
Unexecuted instantiation: cfl_subtract_average_16x4_sse2
Unexecuted instantiation: cfl_subtract_average_16x8_sse2
Unexecuted instantiation: cfl_subtract_average_16x16_sse2
Unexecuted instantiation: cfl_subtract_average_16x32_sse2
Unexecuted instantiation: cfl_subtract_average_32x8_sse2
Unexecuted instantiation: cfl_subtract_average_32x16_sse2
Unexecuted instantiation: cfl_subtract_average_32x32_sse2
cfl_subtract_average_16x4_avx2
Line
Count
Source
178
119k
                                                        int16_t *dst) {      \
179
119k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
119k
                            num_pel_log2);                                   \
181
119k
  }
cfl_subtract_average_16x8_avx2
Line
Count
Source
178
99.4k
                                                        int16_t *dst) {      \
179
99.4k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
99.4k
                            num_pel_log2);                                   \
181
99.4k
  }
cfl_subtract_average_16x16_avx2
Line
Count
Source
178
123k
                                                        int16_t *dst) {      \
179
123k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
123k
                            num_pel_log2);                                   \
181
123k
  }
cfl_subtract_average_16x32_avx2
Line
Count
Source
178
30.6k
                                                        int16_t *dst) {      \
179
30.6k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
30.6k
                            num_pel_log2);                                   \
181
30.6k
  }
cfl_subtract_average_32x8_avx2
Line
Count
Source
178
34.0k
                                                        int16_t *dst) {      \
179
34.0k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
34.0k
                            num_pel_log2);                                   \
181
34.0k
  }
cfl_subtract_average_32x16_avx2
Line
Count
Source
178
22.1k
                                                        int16_t *dst) {      \
179
22.1k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
22.1k
                            num_pel_log2);                                   \
181
22.1k
  }
cfl_subtract_average_32x32_avx2
Line
Count
Source
178
41.2k
                                                        int16_t *dst) {      \
179
41.2k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
180
41.2k
                            num_pel_log2);                                   \
181
41.2k
  }
182
183
// Declare size-specific wrappers for all valid CfL sizes.
184
#define CFL_SUB_AVG_FN(arch)                                              \
185
  CFL_SUB_AVG_X(arch, 4, 4, 8, 4)                                         \
186
  CFL_SUB_AVG_X(arch, 4, 8, 16, 5)                                        \
187
  CFL_SUB_AVG_X(arch, 4, 16, 32, 6)                                       \
188
  CFL_SUB_AVG_X(arch, 8, 4, 16, 5)                                        \
189
  CFL_SUB_AVG_X(arch, 8, 8, 32, 6)                                        \
190
  CFL_SUB_AVG_X(arch, 8, 16, 64, 7)                                       \
191
  CFL_SUB_AVG_X(arch, 8, 32, 128, 8)                                      \
192
  CFL_SUB_AVG_X(arch, 16, 4, 32, 6)                                       \
193
  CFL_SUB_AVG_X(arch, 16, 8, 64, 7)                                       \
194
  CFL_SUB_AVG_X(arch, 16, 16, 128, 8)                                     \
195
  CFL_SUB_AVG_X(arch, 16, 32, 256, 9)                                     \
196
  CFL_SUB_AVG_X(arch, 32, 8, 128, 8)                                      \
197
  CFL_SUB_AVG_X(arch, 32, 16, 256, 9)                                     \
198
  CFL_SUB_AVG_X(arch, 32, 32, 512, 10)                                    \
199
  cfl_subtract_average_fn cfl_get_subtract_average_fn_##arch(             \
200
0
      TX_SIZE tx_size) {                                                  \
201
0
    static const cfl_subtract_average_fn sub_avg[TX_SIZES_ALL] = {        \
202
0
      cfl_subtract_average_4x4_##arch,   /* 4x4 */                        \
203
0
      cfl_subtract_average_8x8_##arch,   /* 8x8 */                        \
204
0
      cfl_subtract_average_16x16_##arch, /* 16x16 */                      \
205
0
      cfl_subtract_average_32x32_##arch, /* 32x32 */                      \
206
0
      NULL,                              /* 64x64 (invalid CFL size) */   \
207
0
      cfl_subtract_average_4x8_##arch,   /* 4x8 */                        \
208
0
      cfl_subtract_average_8x4_##arch,   /* 8x4 */                        \
209
0
      cfl_subtract_average_8x16_##arch,  /* 8x16 */                       \
210
0
      cfl_subtract_average_16x8_##arch,  /* 16x8 */                       \
211
0
      cfl_subtract_average_16x32_##arch, /* 16x32 */                      \
212
0
      cfl_subtract_average_32x16_##arch, /* 32x16 */                      \
213
0
      NULL,                              /* 32x64 (invalid CFL size) */   \
214
0
      NULL,                              /* 64x32 (invalid CFL size) */   \
215
0
      cfl_subtract_average_4x16_##arch,  /* 4x16 */                       \
216
0
      cfl_subtract_average_16x4_##arch,  /* 16x4 */                       \
217
0
      cfl_subtract_average_8x32_##arch,  /* 8x32 */                       \
218
0
      cfl_subtract_average_32x8_##arch,  /* 32x8 */                       \
219
0
      NULL,                              /* 16x64 (invalid CFL size) */   \
220
0
      NULL,                              /* 64x16 (invalid CFL size) */   \
221
0
    };                                                                    \
222
0
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */ \
223
0
    /* index the function pointer array out of bounds. */                 \
224
0
    return sub_avg[tx_size % TX_SIZES_ALL];                               \
225
0
  }
226
227
#define CFL_PREDICT_lbd(arch, width, height)                                   \
228
  void cfl_predict_lbd_##width##x##height##_##arch(                            \
229
      const int16_t *pred_buf_q3, uint8_t *dst, int dst_stride, int alpha_q3); \
230
  void cfl_predict_lbd_##width##x##height##_##arch(                            \
231
      const int16_t *pred_buf_q3, uint8_t *dst, int dst_stride,                \
232
1.81M
      int alpha_q3) {                                                          \
233
1.81M
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
1.81M
                           height);                                            \
235
1.81M
  }
Unexecuted instantiation: cfl_predict_lbd_4x4_c
Unexecuted instantiation: cfl_predict_lbd_4x8_c
Unexecuted instantiation: cfl_predict_lbd_4x16_c
Unexecuted instantiation: cfl_predict_lbd_8x4_c
Unexecuted instantiation: cfl_predict_lbd_8x8_c
Unexecuted instantiation: cfl_predict_lbd_8x16_c
Unexecuted instantiation: cfl_predict_lbd_8x32_c
Unexecuted instantiation: cfl_predict_lbd_16x4_c
Unexecuted instantiation: cfl_predict_lbd_16x8_c
Unexecuted instantiation: cfl_predict_lbd_16x16_c
Unexecuted instantiation: cfl_predict_lbd_16x32_c
Unexecuted instantiation: cfl_predict_lbd_32x8_c
Unexecuted instantiation: cfl_predict_lbd_32x16_c
Unexecuted instantiation: cfl_predict_lbd_32x32_c
cfl_predict_lbd_4x4_ssse3
Line
Count
Source
232
238k
      int alpha_q3) {                                                          \
233
238k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
238k
                           height);                                            \
235
238k
  }
cfl_predict_lbd_4x8_ssse3
Line
Count
Source
232
97.4k
      int alpha_q3) {                                                          \
233
97.4k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
97.4k
                           height);                                            \
235
97.4k
  }
cfl_predict_lbd_4x16_ssse3
Line
Count
Source
232
517k
      int alpha_q3) {                                                          \
233
517k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
517k
                           height);                                            \
235
517k
  }
cfl_predict_lbd_8x4_ssse3
Line
Count
Source
232
144k
      int alpha_q3) {                                                          \
233
144k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
144k
                           height);                                            \
235
144k
  }
cfl_predict_lbd_8x8_ssse3
Line
Count
Source
232
218k
      int alpha_q3) {                                                          \
233
218k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
218k
                           height);                                            \
235
218k
  }
cfl_predict_lbd_8x16_ssse3
Line
Count
Source
232
64.8k
      int alpha_q3) {                                                          \
233
64.8k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
64.8k
                           height);                                            \
235
64.8k
  }
cfl_predict_lbd_8x32_ssse3
Line
Count
Source
232
39.9k
      int alpha_q3) {                                                          \
233
39.9k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
39.9k
                           height);                                            \
235
39.9k
  }
cfl_predict_lbd_16x4_ssse3
Line
Count
Source
232
137k
      int alpha_q3) {                                                          \
233
137k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
137k
                           height);                                            \
235
137k
  }
cfl_predict_lbd_16x8_ssse3
Line
Count
Source
232
93.3k
      int alpha_q3) {                                                          \
233
93.3k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
93.3k
                           height);                                            \
235
93.3k
  }
cfl_predict_lbd_16x16_ssse3
Line
Count
Source
232
124k
      int alpha_q3) {                                                          \
233
124k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
124k
                           height);                                            \
235
124k
  }
cfl_predict_lbd_16x32_ssse3
Line
Count
Source
232
43.1k
      int alpha_q3) {                                                          \
233
43.1k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
43.1k
                           height);                                            \
235
43.1k
  }
Unexecuted instantiation: cfl_predict_lbd_32x8_ssse3
Unexecuted instantiation: cfl_predict_lbd_32x16_ssse3
Unexecuted instantiation: cfl_predict_lbd_32x32_ssse3
cfl_predict_lbd_32x8_avx2
Line
Count
Source
232
31.0k
      int alpha_q3) {                                                          \
233
31.0k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
31.0k
                           height);                                            \
235
31.0k
  }
cfl_predict_lbd_32x16_avx2
Line
Count
Source
232
18.8k
      int alpha_q3) {                                                          \
233
18.8k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
18.8k
                           height);                                            \
235
18.8k
  }
cfl_predict_lbd_32x32_avx2
Line
Count
Source
232
42.9k
      int alpha_q3) {                                                          \
233
42.9k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width,      \
234
42.9k
                           height);                                            \
235
42.9k
  }
236
237
#if CONFIG_AV1_HIGHBITDEPTH
238
#define CFL_PREDICT_hbd(arch, width, height)                                   \
239
  void cfl_predict_hbd_##width##x##height##_##arch(                            \
240
      const int16_t *pred_buf_q3, uint16_t *dst, int dst_stride, int alpha_q3, \
241
      int bd);                                                                 \
242
  void cfl_predict_hbd_##width##x##height##_##arch(                            \
243
      const int16_t *pred_buf_q3, uint16_t *dst, int dst_stride, int alpha_q3, \
244
1.30M
      int bd) {                                                                \
245
1.30M
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
1.30M
                           height);                                            \
247
1.30M
  }
Unexecuted instantiation: cfl_predict_hbd_4x4_c
Unexecuted instantiation: cfl_predict_hbd_4x8_c
Unexecuted instantiation: cfl_predict_hbd_4x16_c
Unexecuted instantiation: cfl_predict_hbd_8x4_c
Unexecuted instantiation: cfl_predict_hbd_8x8_c
Unexecuted instantiation: cfl_predict_hbd_8x16_c
Unexecuted instantiation: cfl_predict_hbd_8x32_c
Unexecuted instantiation: cfl_predict_hbd_16x4_c
Unexecuted instantiation: cfl_predict_hbd_16x8_c
Unexecuted instantiation: cfl_predict_hbd_16x16_c
Unexecuted instantiation: cfl_predict_hbd_16x32_c
Unexecuted instantiation: cfl_predict_hbd_32x8_c
Unexecuted instantiation: cfl_predict_hbd_32x16_c
Unexecuted instantiation: cfl_predict_hbd_32x32_c
cfl_predict_hbd_4x4_ssse3
Line
Count
Source
244
241k
      int bd) {                                                                \
245
241k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
241k
                           height);                                            \
247
241k
  }
cfl_predict_hbd_4x8_ssse3
Line
Count
Source
244
80.8k
      int bd) {                                                                \
245
80.8k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
80.8k
                           height);                                            \
247
80.8k
  }
cfl_predict_hbd_4x16_ssse3
Line
Count
Source
244
67.0k
      int bd) {                                                                \
245
67.0k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
67.0k
                           height);                                            \
247
67.0k
  }
cfl_predict_hbd_8x4_ssse3
Line
Count
Source
244
149k
      int bd) {                                                                \
245
149k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
149k
                           height);                                            \
247
149k
  }
cfl_predict_hbd_8x8_ssse3
Line
Count
Source
244
212k
      int bd) {                                                                \
245
212k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
212k
                           height);                                            \
247
212k
  }
cfl_predict_hbd_8x16_ssse3
Line
Count
Source
244
78.2k
      int bd) {                                                                \
245
78.2k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
78.2k
                           height);                                            \
247
78.2k
  }
cfl_predict_hbd_8x32_ssse3
Line
Count
Source
244
30.8k
      int bd) {                                                                \
245
30.8k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
30.8k
                           height);                                            \
247
30.8k
  }
Unexecuted instantiation: cfl_predict_hbd_16x4_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x8_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x16_ssse3
Unexecuted instantiation: cfl_predict_hbd_16x32_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x8_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x16_ssse3
Unexecuted instantiation: cfl_predict_hbd_32x32_ssse3
cfl_predict_hbd_16x4_avx2
Line
Count
Source
244
101k
      int bd) {                                                                \
245
101k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
101k
                           height);                                            \
247
101k
  }
cfl_predict_hbd_16x8_avx2
Line
Count
Source
244
105k
      int bd) {                                                                \
245
105k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
105k
                           height);                                            \
247
105k
  }
cfl_predict_hbd_16x16_avx2
Line
Count
Source
244
122k
      int bd) {                                                                \
245
122k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
122k
                           height);                                            \
247
122k
  }
cfl_predict_hbd_16x32_avx2
Line
Count
Source
244
18.1k
      int bd) {                                                                \
245
18.1k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
18.1k
                           height);                                            \
247
18.1k
  }
cfl_predict_hbd_32x8_avx2
Line
Count
Source
244
36.9k
      int bd) {                                                                \
245
36.9k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
36.9k
                           height);                                            \
247
36.9k
  }
cfl_predict_hbd_32x16_avx2
Line
Count
Source
244
25.5k
      int bd) {                                                                \
245
25.5k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
25.5k
                           height);                                            \
247
25.5k
  }
cfl_predict_hbd_32x32_avx2
Line
Count
Source
244
39.4k
      int bd) {                                                                \
245
39.4k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
246
39.4k
                           height);                                            \
247
39.4k
  }
248
#endif
249
250
// This wrapper exists because clang format does not like calling macros with
251
// lowercase letters.
252
#define CFL_PREDICT_X(arch, width, height, bd) \
253
  CFL_PREDICT_##bd(arch, width, height)
254
255
#define CFL_PREDICT_FN(arch, bd)                                            \
256
  CFL_PREDICT_X(arch, 4, 4, bd)                                             \
257
  CFL_PREDICT_X(arch, 4, 8, bd)                                             \
258
  CFL_PREDICT_X(arch, 4, 16, bd)                                            \
259
  CFL_PREDICT_X(arch, 8, 4, bd)                                             \
260
  CFL_PREDICT_X(arch, 8, 8, bd)                                             \
261
  CFL_PREDICT_X(arch, 8, 16, bd)                                            \
262
  CFL_PREDICT_X(arch, 8, 32, bd)                                            \
263
  CFL_PREDICT_X(arch, 16, 4, bd)                                            \
264
  CFL_PREDICT_X(arch, 16, 8, bd)                                            \
265
  CFL_PREDICT_X(arch, 16, 16, bd)                                           \
266
  CFL_PREDICT_X(arch, 16, 32, bd)                                           \
267
  CFL_PREDICT_X(arch, 32, 8, bd)                                            \
268
  CFL_PREDICT_X(arch, 32, 16, bd)                                           \
269
  CFL_PREDICT_X(arch, 32, 32, bd)                                           \
270
0
  cfl_predict_##bd##_fn cfl_get_predict_##bd##_fn_##arch(TX_SIZE tx_size) { \
271
0
    static const cfl_predict_##bd##_fn pred[TX_SIZES_ALL] = {               \
272
0
      cfl_predict_##bd##_4x4_##arch,   /* 4x4 */                            \
273
0
      cfl_predict_##bd##_8x8_##arch,   /* 8x8 */                            \
274
0
      cfl_predict_##bd##_16x16_##arch, /* 16x16 */                          \
275
0
      cfl_predict_##bd##_32x32_##arch, /* 32x32 */                          \
276
0
      NULL,                            /* 64x64 (invalid CFL size) */       \
277
0
      cfl_predict_##bd##_4x8_##arch,   /* 4x8 */                            \
278
0
      cfl_predict_##bd##_8x4_##arch,   /* 8x4 */                            \
279
0
      cfl_predict_##bd##_8x16_##arch,  /* 8x16 */                           \
280
0
      cfl_predict_##bd##_16x8_##arch,  /* 16x8 */                           \
281
0
      cfl_predict_##bd##_16x32_##arch, /* 16x32 */                          \
282
0
      cfl_predict_##bd##_32x16_##arch, /* 32x16 */                          \
283
0
      NULL,                            /* 32x64 (invalid CFL size) */       \
284
0
      NULL,                            /* 64x32 (invalid CFL size) */       \
285
0
      cfl_predict_##bd##_4x16_##arch,  /* 4x16  */                          \
286
0
      cfl_predict_##bd##_16x4_##arch,  /* 16x4  */                          \
287
0
      cfl_predict_##bd##_8x32_##arch,  /* 8x32  */                          \
288
0
      cfl_predict_##bd##_32x8_##arch,  /* 32x8  */                          \
289
0
      NULL,                            /* 16x64 (invalid CFL size) */       \
290
0
      NULL,                            /* 64x16 (invalid CFL size) */       \
291
0
    };                                                                      \
292
0
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */   \
293
0
    /* index the function pointer array out of bounds. */                   \
294
0
    return pred[tx_size % TX_SIZES_ALL];                                    \
295
0
  }
296
297
#endif  // AOM_AV1_COMMON_CFL_H_