Coverage Report

Created: 2022-08-24 06:17

/src/aom/av1/common/cfl.h
Line
Count
Source (jump to first uncovered line)
1
/*
2
 * Copyright (c) 2016, Alliance for Open Media. All rights reserved
3
 *
4
 * This source code is subject to the terms of the BSD 2 Clause License and
5
 * the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
6
 * was not distributed with this source code in the LICENSE file, you can
7
 * obtain it at www.aomedia.org/license/software. If the Alliance for Open
8
 * Media Patent License 1.0 was not distributed with this source code in the
9
 * PATENTS file, you can obtain it at www.aomedia.org/license/patent.
10
 */
11
12
#ifndef AOM_AV1_COMMON_CFL_H_
13
#define AOM_AV1_COMMON_CFL_H_
14
15
#include "av1/common/av1_common_int.h"
16
#include "av1/common/blockd.h"
17
18
// Can we use CfL for the current block?
19
3.65M
static INLINE CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
3.65M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
3.65M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
3.65M
  assert(bsize < BLOCK_SIZES_ALL);
23
3.65M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
6.29k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
6.29k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
6.29k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
6.29k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
6.29k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
3.64M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
3.64M
                            block_size_high[bsize] <= 32);
34
3.65M
}
Unexecuted instantiation: decodeframe.c:is_cfl_allowed
decodemv.c:is_cfl_allowed
Line
Count
Source
19
3.65M
static INLINE CFL_ALLOWED_TYPE is_cfl_allowed(const MACROBLOCKD *xd) {
20
3.65M
  const MB_MODE_INFO *mbmi = xd->mi[0];
21
3.65M
  const BLOCK_SIZE bsize = mbmi->bsize;
22
3.65M
  assert(bsize < BLOCK_SIZES_ALL);
23
3.65M
  if (xd->lossless[mbmi->segment_id]) {
24
    // In lossless, CfL is available when the partition size is equal to the
25
    // transform size.
26
6.29k
    const int ssx = xd->plane[AOM_PLANE_U].subsampling_x;
27
6.29k
    const int ssy = xd->plane[AOM_PLANE_U].subsampling_y;
28
6.29k
    const int plane_bsize = get_plane_block_size(bsize, ssx, ssy);
29
6.29k
    return (CFL_ALLOWED_TYPE)(plane_bsize == BLOCK_4X4);
30
6.29k
  }
31
  // Spec: CfL is available to luma partitions lesser than or equal to 32x32
32
3.64M
  return (CFL_ALLOWED_TYPE)(block_size_wide[bsize] <= 32 &&
33
3.64M
                            block_size_high[bsize] <= 32);
34
3.65M
}
Unexecuted instantiation: bitstream.c:is_cfl_allowed
Unexecuted instantiation: encoder.c:is_cfl_allowed
Unexecuted instantiation: encoder_utils.c:is_cfl_allowed
Unexecuted instantiation: encodetxb.c:is_cfl_allowed
Unexecuted instantiation: ethread.c:is_cfl_allowed
Unexecuted instantiation: global_motion_facade.c:is_cfl_allowed
Unexecuted instantiation: mcomp.c:is_cfl_allowed
Unexecuted instantiation: palette.c:is_cfl_allowed
Unexecuted instantiation: rdopt.c:is_cfl_allowed
Unexecuted instantiation: speed_features.c:is_cfl_allowed
Unexecuted instantiation: superres_scale.c:is_cfl_allowed
Unexecuted instantiation: svc_layercontext.c:is_cfl_allowed
Unexecuted instantiation: tokenize.c:is_cfl_allowed
Unexecuted instantiation: tpl_model.c:is_cfl_allowed
Unexecuted instantiation: tx_search.c:is_cfl_allowed
Unexecuted instantiation: intra_mode_search.c:is_cfl_allowed
Unexecuted instantiation: cfl.c:is_cfl_allowed
Unexecuted instantiation: reconintra.c:is_cfl_allowed
Unexecuted instantiation: allintra_vis.c:is_cfl_allowed
Unexecuted instantiation: compound_type.c:is_cfl_allowed
Unexecuted instantiation: encodeframe.c:is_cfl_allowed
Unexecuted instantiation: encodeframe_utils.c:is_cfl_allowed
Unexecuted instantiation: encodemb.c:is_cfl_allowed
Unexecuted instantiation: encode_strategy.c:is_cfl_allowed
Unexecuted instantiation: interp_search.c:is_cfl_allowed
Unexecuted instantiation: motion_search_facade.c:is_cfl_allowed
Unexecuted instantiation: partition_search.c:is_cfl_allowed
Unexecuted instantiation: partition_strategy.c:is_cfl_allowed
Unexecuted instantiation: nonrd_pickmode.c:is_cfl_allowed
35
36
// Do we need to save the luma pixels from the current block,
37
// for a possible future CfL prediction?
38
static INLINE CFL_ALLOWED_TYPE store_cfl_required(const AV1_COMMON *cm,
39
9.66M
                                                  const MACROBLOCKD *xd) {
40
9.66M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
9.66M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
9.66M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
1.41M
    return CFL_ALLOWED;
51
1.41M
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
8.25M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
8.25M
                            mbmi->uv_mode == UV_CFL_PRED);
57
9.66M
}
decodeframe.c:store_cfl_required
Line
Count
Source
39
5.31M
                                                  const MACROBLOCKD *xd) {
40
5.31M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
5.31M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
5.31M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
713k
    return CFL_ALLOWED;
51
713k
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
4.60M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
4.60M
                            mbmi->uv_mode == UV_CFL_PRED);
57
5.31M
}
decodemv.c:store_cfl_required
Line
Count
Source
39
4.35M
                                                  const MACROBLOCKD *xd) {
40
4.35M
  const MB_MODE_INFO *mbmi = xd->mi[0];
41
42
4.35M
  if (cm->seq_params->monochrome) return CFL_DISALLOWED;
43
44
4.35M
  if (!xd->is_chroma_ref) {
45
    // For non-chroma-reference blocks, we should always store the luma pixels,
46
    // in case the corresponding chroma-reference block uses CfL.
47
    // Note that this can only happen for block sizes which are <8 on
48
    // their shortest side, as otherwise they would be chroma reference
49
    // blocks.
50
697k
    return CFL_ALLOWED;
51
697k
  }
52
53
  // If this block has chroma information, we know whether we're
54
  // actually going to perform a CfL prediction
55
3.65M
  return (CFL_ALLOWED_TYPE)(!is_inter_block(mbmi) &&
56
3.65M
                            mbmi->uv_mode == UV_CFL_PRED);
57
4.35M
}
Unexecuted instantiation: bitstream.c:store_cfl_required
Unexecuted instantiation: encoder.c:store_cfl_required
Unexecuted instantiation: encoder_utils.c:store_cfl_required
Unexecuted instantiation: encodetxb.c:store_cfl_required
Unexecuted instantiation: ethread.c:store_cfl_required
Unexecuted instantiation: global_motion_facade.c:store_cfl_required
Unexecuted instantiation: mcomp.c:store_cfl_required
Unexecuted instantiation: palette.c:store_cfl_required
Unexecuted instantiation: rdopt.c:store_cfl_required
Unexecuted instantiation: speed_features.c:store_cfl_required
Unexecuted instantiation: superres_scale.c:store_cfl_required
Unexecuted instantiation: svc_layercontext.c:store_cfl_required
Unexecuted instantiation: tokenize.c:store_cfl_required
Unexecuted instantiation: tpl_model.c:store_cfl_required
Unexecuted instantiation: tx_search.c:store_cfl_required
Unexecuted instantiation: intra_mode_search.c:store_cfl_required
Unexecuted instantiation: cfl.c:store_cfl_required
Unexecuted instantiation: reconintra.c:store_cfl_required
Unexecuted instantiation: allintra_vis.c:store_cfl_required
Unexecuted instantiation: compound_type.c:store_cfl_required
Unexecuted instantiation: encodeframe.c:store_cfl_required
Unexecuted instantiation: encodeframe_utils.c:store_cfl_required
Unexecuted instantiation: encodemb.c:store_cfl_required
Unexecuted instantiation: encode_strategy.c:store_cfl_required
Unexecuted instantiation: interp_search.c:store_cfl_required
Unexecuted instantiation: motion_search_facade.c:store_cfl_required
Unexecuted instantiation: partition_search.c:store_cfl_required
Unexecuted instantiation: partition_strategy.c:store_cfl_required
Unexecuted instantiation: nonrd_pickmode.c:store_cfl_required
58
59
86.3M
static INLINE int get_scaled_luma_q0(int alpha_q3, int16_t pred_buf_q3) {
60
86.3M
  int scaled_luma_q6 = alpha_q3 * pred_buf_q3;
61
86.3M
  return ROUND_POWER_OF_TWO_SIGNED(scaled_luma_q6, 6);
62
86.3M
}
Unexecuted instantiation: decodeframe.c:get_scaled_luma_q0
Unexecuted instantiation: decodemv.c:get_scaled_luma_q0
Unexecuted instantiation: bitstream.c:get_scaled_luma_q0
Unexecuted instantiation: encoder.c:get_scaled_luma_q0
Unexecuted instantiation: encoder_utils.c:get_scaled_luma_q0
Unexecuted instantiation: encodetxb.c:get_scaled_luma_q0
Unexecuted instantiation: ethread.c:get_scaled_luma_q0
Unexecuted instantiation: global_motion_facade.c:get_scaled_luma_q0
Unexecuted instantiation: mcomp.c:get_scaled_luma_q0
Unexecuted instantiation: palette.c:get_scaled_luma_q0
Unexecuted instantiation: rdopt.c:get_scaled_luma_q0
Unexecuted instantiation: speed_features.c:get_scaled_luma_q0
Unexecuted instantiation: superres_scale.c:get_scaled_luma_q0
Unexecuted instantiation: svc_layercontext.c:get_scaled_luma_q0
Unexecuted instantiation: tokenize.c:get_scaled_luma_q0
Unexecuted instantiation: tpl_model.c:get_scaled_luma_q0
Unexecuted instantiation: tx_search.c:get_scaled_luma_q0
Unexecuted instantiation: intra_mode_search.c:get_scaled_luma_q0
cfl.c:get_scaled_luma_q0
Line
Count
Source
59
86.3M
static INLINE int get_scaled_luma_q0(int alpha_q3, int16_t pred_buf_q3) {
60
86.3M
  int scaled_luma_q6 = alpha_q3 * pred_buf_q3;
61
86.3M
  return ROUND_POWER_OF_TWO_SIGNED(scaled_luma_q6, 6);
62
86.3M
}
Unexecuted instantiation: reconintra.c:get_scaled_luma_q0
Unexecuted instantiation: allintra_vis.c:get_scaled_luma_q0
Unexecuted instantiation: compound_type.c:get_scaled_luma_q0
Unexecuted instantiation: encodeframe.c:get_scaled_luma_q0
Unexecuted instantiation: encodeframe_utils.c:get_scaled_luma_q0
Unexecuted instantiation: encodemb.c:get_scaled_luma_q0
Unexecuted instantiation: encode_strategy.c:get_scaled_luma_q0
Unexecuted instantiation: interp_search.c:get_scaled_luma_q0
Unexecuted instantiation: motion_search_facade.c:get_scaled_luma_q0
Unexecuted instantiation: partition_search.c:get_scaled_luma_q0
Unexecuted instantiation: partition_strategy.c:get_scaled_luma_q0
Unexecuted instantiation: nonrd_pickmode.c:get_scaled_luma_q0
63
64
1.85M
static INLINE CFL_PRED_TYPE get_cfl_pred_type(PLANE_TYPE plane) {
65
1.85M
  assert(plane > 0);
66
1.85M
  return (CFL_PRED_TYPE)(plane - 1);
67
1.85M
}
Unexecuted instantiation: decodeframe.c:get_cfl_pred_type
Unexecuted instantiation: decodemv.c:get_cfl_pred_type
Unexecuted instantiation: bitstream.c:get_cfl_pred_type
Unexecuted instantiation: encoder.c:get_cfl_pred_type
Unexecuted instantiation: encoder_utils.c:get_cfl_pred_type
Unexecuted instantiation: encodetxb.c:get_cfl_pred_type
Unexecuted instantiation: ethread.c:get_cfl_pred_type
Unexecuted instantiation: global_motion_facade.c:get_cfl_pred_type
Unexecuted instantiation: mcomp.c:get_cfl_pred_type
Unexecuted instantiation: palette.c:get_cfl_pred_type
Unexecuted instantiation: rdopt.c:get_cfl_pred_type
Unexecuted instantiation: speed_features.c:get_cfl_pred_type
Unexecuted instantiation: superres_scale.c:get_cfl_pred_type
Unexecuted instantiation: svc_layercontext.c:get_cfl_pred_type
Unexecuted instantiation: tokenize.c:get_cfl_pred_type
Unexecuted instantiation: tpl_model.c:get_cfl_pred_type
Unexecuted instantiation: tx_search.c:get_cfl_pred_type
Unexecuted instantiation: intra_mode_search.c:get_cfl_pred_type
Unexecuted instantiation: cfl.c:get_cfl_pred_type
reconintra.c:get_cfl_pred_type
Line
Count
Source
64
1.85M
static INLINE CFL_PRED_TYPE get_cfl_pred_type(PLANE_TYPE plane) {
65
1.85M
  assert(plane > 0);
66
1.85M
  return (CFL_PRED_TYPE)(plane - 1);
67
1.85M
}
Unexecuted instantiation: allintra_vis.c:get_cfl_pred_type
Unexecuted instantiation: compound_type.c:get_cfl_pred_type
Unexecuted instantiation: encodeframe.c:get_cfl_pred_type
Unexecuted instantiation: encodeframe_utils.c:get_cfl_pred_type
Unexecuted instantiation: encodemb.c:get_cfl_pred_type
Unexecuted instantiation: encode_strategy.c:get_cfl_pred_type
Unexecuted instantiation: interp_search.c:get_cfl_pred_type
Unexecuted instantiation: motion_search_facade.c:get_cfl_pred_type
Unexecuted instantiation: partition_search.c:get_cfl_pred_type
Unexecuted instantiation: partition_strategy.c:get_cfl_pred_type
Unexecuted instantiation: nonrd_pickmode.c:get_cfl_pred_type
68
69
void cfl_predict_block(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
70
                       TX_SIZE tx_size, int plane);
71
72
void cfl_store_block(MACROBLOCKD *const xd, BLOCK_SIZE bsize, TX_SIZE tx_size);
73
74
void cfl_store_tx(MACROBLOCKD *const xd, int row, int col, TX_SIZE tx_size,
75
                  BLOCK_SIZE bsize);
76
77
void cfl_store_dc_pred(MACROBLOCKD *const xd, const uint8_t *input,
78
                       CFL_PRED_TYPE pred_plane, int width);
79
80
void cfl_load_dc_pred(MACROBLOCKD *const xd, uint8_t *dst, int dst_stride,
81
                      TX_SIZE tx_size, CFL_PRED_TYPE pred_plane);
82
83
// Allows the CFL_SUBSAMPLE function to switch types depending on the bitdepth.
84
#define CFL_lbd_TYPE uint8_t *cfl_type
85
#define CFL_hbd_TYPE uint16_t *cfl_type
86
87
// Declare a size-specific wrapper for the size-generic function. The compiler
88
// will inline the size generic function in here, the advantage is that the size
89
// will be constant allowing for loop unrolling and other constant propagated
90
// goodness.
91
#define CFL_SUBSAMPLE(arch, sub, bd, width, height)                       \
92
  void cfl_subsample_##bd##_##sub##_##width##x##height##_##arch(          \
93
1.70M
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
1.70M
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
1.70M
                                               output_q3, width, height); \
96
1.70M
  }
cfl_subsample_lbd_420_4x4_c
Line
Count
Source
93
146k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
146k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
146k
                                               output_q3, width, height); \
96
146k
  }
cfl_subsample_lbd_420_8x8_c
Line
Count
Source
93
170k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
170k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
170k
                                               output_q3, width, height); \
96
170k
  }
cfl_subsample_lbd_420_16x16_c
Line
Count
Source
93
66.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
66.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
66.5k
                                               output_q3, width, height); \
96
66.5k
  }
cfl_subsample_lbd_420_32x32_c
Line
Count
Source
93
21.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
21.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
21.4k
                                               output_q3, width, height); \
96
21.4k
  }
cfl_subsample_lbd_420_4x8_c
Line
Count
Source
93
86.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
86.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
86.0k
                                               output_q3, width, height); \
96
86.0k
  }
cfl_subsample_lbd_420_8x4_c
Line
Count
Source
93
103k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
103k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
103k
                                               output_q3, width, height); \
96
103k
  }
cfl_subsample_lbd_420_8x16_c
Line
Count
Source
93
50.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
50.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
50.5k
                                               output_q3, width, height); \
96
50.5k
  }
cfl_subsample_lbd_420_16x8_c
Line
Count
Source
93
96.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
96.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
96.7k
                                               output_q3, width, height); \
96
96.7k
  }
cfl_subsample_lbd_420_16x32_c
Line
Count
Source
93
11.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
11.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
11.8k
                                               output_q3, width, height); \
96
11.8k
  }
cfl_subsample_lbd_420_32x16_c
Line
Count
Source
93
14.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
14.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
14.5k
                                               output_q3, width, height); \
96
14.5k
  }
cfl_subsample_lbd_420_4x16_c
Line
Count
Source
93
155k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
155k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
155k
                                               output_q3, width, height); \
96
155k
  }
cfl_subsample_lbd_420_16x4_c
Line
Count
Source
93
138k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
138k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
138k
                                               output_q3, width, height); \
96
138k
  }
cfl_subsample_lbd_420_8x32_c
Line
Count
Source
93
19.9k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
19.9k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
19.9k
                                               output_q3, width, height); \
96
19.9k
  }
cfl_subsample_lbd_420_32x8_c
Line
Count
Source
93
26.1k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
26.1k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
26.1k
                                               output_q3, width, height); \
96
26.1k
  }
Unexecuted instantiation: cfl_subsample_lbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_lbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_lbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_lbd_444_32x8_c
cfl_subsample_hbd_420_4x4_c
Line
Count
Source
93
82.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
82.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
82.8k
                                               output_q3, width, height); \
96
82.8k
  }
cfl_subsample_hbd_420_8x8_c
Line
Count
Source
93
88.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
88.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
88.3k
                                               output_q3, width, height); \
96
88.3k
  }
cfl_subsample_hbd_420_16x16_c
Line
Count
Source
93
35.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
35.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
35.8k
                                               output_q3, width, height); \
96
35.8k
  }
cfl_subsample_hbd_420_32x32_c
Line
Count
Source
93
15.7k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
15.7k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
15.7k
                                               output_q3, width, height); \
96
15.7k
  }
cfl_subsample_hbd_420_4x8_c
Line
Count
Source
93
44.6k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
44.6k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
44.6k
                                               output_q3, width, height); \
96
44.6k
  }
cfl_subsample_hbd_420_8x4_c
Line
Count
Source
93
68.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
68.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
68.0k
                                               output_q3, width, height); \
96
68.0k
  }
cfl_subsample_hbd_420_8x16_c
Line
Count
Source
93
26.3k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
26.3k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
26.3k
                                               output_q3, width, height); \
96
26.3k
  }
cfl_subsample_hbd_420_16x8_c
Line
Count
Source
93
44.8k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
44.8k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
44.8k
                                               output_q3, width, height); \
96
44.8k
  }
cfl_subsample_hbd_420_16x32_c
Line
Count
Source
93
7.63k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
7.63k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
7.63k
                                               output_q3, width, height); \
96
7.63k
  }
cfl_subsample_hbd_420_32x16_c
Line
Count
Source
93
9.52k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
9.52k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
9.52k
                                               output_q3, width, height); \
96
9.52k
  }
cfl_subsample_hbd_420_4x16_c
Line
Count
Source
93
68.2k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
68.2k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
68.2k
                                               output_q3, width, height); \
96
68.2k
  }
cfl_subsample_hbd_420_16x4_c
Line
Count
Source
93
74.4k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
74.4k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
74.4k
                                               output_q3, width, height); \
96
74.4k
  }
cfl_subsample_hbd_420_8x32_c
Line
Count
Source
93
12.0k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
12.0k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
12.0k
                                               output_q3, width, height); \
96
12.0k
  }
cfl_subsample_hbd_420_32x8_c
Line
Count
Source
93
13.5k
      const CFL_##bd##_TYPE, int input_stride, uint16_t *output_q3) {     \
94
13.5k
    cfl_luma_subsampling_##sub##_##bd##_##arch(cfl_type, input_stride,    \
95
13.5k
                                               output_q3, width, height); \
96
13.5k
  }
Unexecuted instantiation: cfl_subsample_hbd_422_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_422_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_422_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_422_32x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x8_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_4x16_c
Unexecuted instantiation: cfl_subsample_hbd_444_16x4_c
Unexecuted instantiation: cfl_subsample_hbd_444_8x32_c
Unexecuted instantiation: cfl_subsample_hbd_444_32x8_c
97
98
// Declare size-specific wrappers for all valid CfL sizes.
99
#define CFL_SUBSAMPLE_FUNCTIONS(arch, sub, bd)                            \
100
  CFL_SUBSAMPLE(arch, sub, bd, 4, 4)                                      \
101
  CFL_SUBSAMPLE(arch, sub, bd, 8, 8)                                      \
102
  CFL_SUBSAMPLE(arch, sub, bd, 16, 16)                                    \
103
  CFL_SUBSAMPLE(arch, sub, bd, 32, 32)                                    \
104
  CFL_SUBSAMPLE(arch, sub, bd, 4, 8)                                      \
105
  CFL_SUBSAMPLE(arch, sub, bd, 8, 4)                                      \
106
  CFL_SUBSAMPLE(arch, sub, bd, 8, 16)                                     \
107
  CFL_SUBSAMPLE(arch, sub, bd, 16, 8)                                     \
108
  CFL_SUBSAMPLE(arch, sub, bd, 16, 32)                                    \
109
  CFL_SUBSAMPLE(arch, sub, bd, 32, 16)                                    \
110
  CFL_SUBSAMPLE(arch, sub, bd, 4, 16)                                     \
111
  CFL_SUBSAMPLE(arch, sub, bd, 16, 4)                                     \
112
  CFL_SUBSAMPLE(arch, sub, bd, 8, 32)                                     \
113
  CFL_SUBSAMPLE(arch, sub, bd, 32, 8)                                     \
114
  cfl_subsample_##bd##_fn cfl_get_luma_subsampling_##sub##_##bd##_##arch( \
115
1.70M
      TX_SIZE tx_size) {                                                  \
116
1.70M
    CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
117
1.70M
    return subfn_##sub[tx_size];                                          \
118
1.70M
  }
cfl_get_luma_subsampling_420_lbd_c
Line
Count
Source
115
1.10M
      TX_SIZE tx_size) {                                                  \
116
1.10M
    CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
117
1.10M
    return subfn_##sub[tx_size];                                          \
118
1.10M
  }
Unexecuted instantiation: cfl_get_luma_subsampling_422_lbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_444_lbd_c
cfl_get_luma_subsampling_420_hbd_c
Line
Count
Source
115
592k
      TX_SIZE tx_size) {                                                  \
116
592k
    CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
117
592k
    return subfn_##sub[tx_size];                                          \
118
592k
  }
Unexecuted instantiation: cfl_get_luma_subsampling_422_hbd_c
Unexecuted instantiation: cfl_get_luma_subsampling_444_hbd_c
119
120
// Declare an architecture-specific array of function pointers for size-specific
121
// wrappers.
122
#define CFL_SUBSAMPLE_FUNCTION_ARRAY(arch, sub, bd)                           \
123
1.70M
  static const cfl_subsample_##bd##_fn subfn_##sub[TX_SIZES_ALL] = {          \
124
1.70M
    cfl_subsample_##bd##_##sub##_4x4_##arch,   /* 4x4 */                      \
125
1.70M
    cfl_subsample_##bd##_##sub##_8x8_##arch,   /* 8x8 */                      \
126
1.70M
    cfl_subsample_##bd##_##sub##_16x16_##arch, /* 16x16 */                    \
127
1.70M
    cfl_subsample_##bd##_##sub##_32x32_##arch, /* 32x32 */                    \
128
1.70M
    NULL,                                      /* 64x64 (invalid CFL size) */ \
129
1.70M
    cfl_subsample_##bd##_##sub##_4x8_##arch,   /* 4x8 */                      \
130
1.70M
    cfl_subsample_##bd##_##sub##_8x4_##arch,   /* 8x4 */                      \
131
1.70M
    cfl_subsample_##bd##_##sub##_8x16_##arch,  /* 8x16 */                     \
132
1.70M
    cfl_subsample_##bd##_##sub##_16x8_##arch,  /* 16x8 */                     \
133
1.70M
    cfl_subsample_##bd##_##sub##_16x32_##arch, /* 16x32 */                    \
134
1.70M
    cfl_subsample_##bd##_##sub##_32x16_##arch, /* 32x16 */                    \
135
1.70M
    NULL,                                      /* 32x64 (invalid CFL size) */ \
136
1.70M
    NULL,                                      /* 64x32 (invalid CFL size) */ \
137
1.70M
    cfl_subsample_##bd##_##sub##_4x16_##arch,  /* 4x16  */                    \
138
1.70M
    cfl_subsample_##bd##_##sub##_16x4_##arch,  /* 16x4  */                    \
139
1.70M
    cfl_subsample_##bd##_##sub##_8x32_##arch,  /* 8x32  */                    \
140
1.70M
    cfl_subsample_##bd##_##sub##_32x8_##arch,  /* 32x8  */                    \
141
1.70M
    NULL,                                      /* 16x64 (invalid CFL size) */ \
142
1.70M
    NULL,                                      /* 64x16 (invalid CFL size) */ \
143
1.70M
  };
144
145
// The RTCD script does not support passing in an array, so we wrap it in this
146
// function.
147
#if CONFIG_AV1_HIGHBITDEPTH
148
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
149
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
150
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
151
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd) \
152
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, hbd) \
153
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, hbd) \
154
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, hbd)
155
#else
156
#define CFL_GET_SUBSAMPLE_FUNCTION(arch)  \
157
  CFL_SUBSAMPLE_FUNCTIONS(arch, 420, lbd) \
158
  CFL_SUBSAMPLE_FUNCTIONS(arch, 422, lbd) \
159
  CFL_SUBSAMPLE_FUNCTIONS(arch, 444, lbd)
160
#endif
161
162
// Declare a size-specific wrapper for the size-generic function. The compiler
163
// will inline the size generic function in here, the advantage is that the size
164
// will be constant allowing for loop unrolling and other constant propagated
165
// goodness.
166
#define CFL_SUB_AVG_X(arch, width, height, round_offset, num_pel_log2)       \
167
  void cfl_subtract_average_##width##x##height##_##arch(const uint16_t *src, \
168
927k
                                                        int16_t *dst) {      \
169
927k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
927k
                            num_pel_log2);                                   \
171
927k
  }
cfl_subtract_average_4x4_c
Line
Count
Source
168
314k
                                                        int16_t *dst) {      \
169
314k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
314k
                            num_pel_log2);                                   \
171
314k
  }
cfl_subtract_average_4x8_c
Line
Count
Source
168
150k
                                                        int16_t *dst) {      \
169
150k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
150k
                            num_pel_log2);                                   \
171
150k
  }
cfl_subtract_average_4x16_c
Line
Count
Source
168
32.6k
                                                        int16_t *dst) {      \
169
32.6k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
32.6k
                            num_pel_log2);                                   \
171
32.6k
  }
cfl_subtract_average_8x4_c
Line
Count
Source
168
201k
                                                        int16_t *dst) {      \
169
201k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
201k
                            num_pel_log2);                                   \
171
201k
  }
cfl_subtract_average_8x8_c
Line
Count
Source
168
104k
                                                        int16_t *dst) {      \
169
104k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
104k
                            num_pel_log2);                                   \
171
104k
  }
cfl_subtract_average_8x16_c
Line
Count
Source
168
19.9k
                                                        int16_t *dst) {      \
169
19.9k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
19.9k
                            num_pel_log2);                                   \
171
19.9k
  }
Unexecuted instantiation: cfl_subtract_average_8x32_c
cfl_subtract_average_16x4_c
Line
Count
Source
168
40.4k
                                                        int16_t *dst) {      \
169
40.4k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
40.4k
                            num_pel_log2);                                   \
171
40.4k
  }
cfl_subtract_average_16x8_c
Line
Count
Source
168
24.7k
                                                        int16_t *dst) {      \
169
24.7k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
24.7k
                            num_pel_log2);                                   \
171
24.7k
  }
cfl_subtract_average_16x16_c
Line
Count
Source
168
38.3k
                                                        int16_t *dst) {      \
169
38.3k
    subtract_average_##arch(src, dst, width, height, round_offset,           \
170
38.3k
                            num_pel_log2);                                   \
171
38.3k
  }
Unexecuted instantiation: cfl_subtract_average_16x32_c
Unexecuted instantiation: cfl_subtract_average_32x8_c
Unexecuted instantiation: cfl_subtract_average_32x16_c
Unexecuted instantiation: cfl_subtract_average_32x32_c
172
173
// Declare size-specific wrappers for all valid CfL sizes.
174
#define CFL_SUB_AVG_FN(arch)                                              \
175
  CFL_SUB_AVG_X(arch, 4, 4, 8, 4)                                         \
176
  CFL_SUB_AVG_X(arch, 4, 8, 16, 5)                                        \
177
  CFL_SUB_AVG_X(arch, 4, 16, 32, 6)                                       \
178
  CFL_SUB_AVG_X(arch, 8, 4, 16, 5)                                        \
179
  CFL_SUB_AVG_X(arch, 8, 8, 32, 6)                                        \
180
  CFL_SUB_AVG_X(arch, 8, 16, 64, 7)                                       \
181
  CFL_SUB_AVG_X(arch, 8, 32, 128, 8)                                      \
182
  CFL_SUB_AVG_X(arch, 16, 4, 32, 6)                                       \
183
  CFL_SUB_AVG_X(arch, 16, 8, 64, 7)                                       \
184
  CFL_SUB_AVG_X(arch, 16, 16, 128, 8)                                     \
185
  CFL_SUB_AVG_X(arch, 16, 32, 256, 9)                                     \
186
  CFL_SUB_AVG_X(arch, 32, 8, 128, 8)                                      \
187
  CFL_SUB_AVG_X(arch, 32, 16, 256, 9)                                     \
188
  CFL_SUB_AVG_X(arch, 32, 32, 512, 10)                                    \
189
  cfl_subtract_average_fn cfl_get_subtract_average_fn_##arch(             \
190
927k
      TX_SIZE tx_size) {                                                  \
191
927k
    static const cfl_subtract_average_fn sub_avg[TX_SIZES_ALL] = {        \
192
927k
      cfl_subtract_average_4x4_##arch,   /* 4x4 */                        \
193
927k
      cfl_subtract_average_8x8_##arch,   /* 8x8 */                        \
194
927k
      cfl_subtract_average_16x16_##arch, /* 16x16 */                      \
195
927k
      cfl_subtract_average_32x32_##arch, /* 32x32 */                      \
196
927k
      NULL,                              /* 64x64 (invalid CFL size) */   \
197
927k
      cfl_subtract_average_4x8_##arch,   /* 4x8 */                        \
198
927k
      cfl_subtract_average_8x4_##arch,   /* 8x4 */                        \
199
927k
      cfl_subtract_average_8x16_##arch,  /* 8x16 */                       \
200
927k
      cfl_subtract_average_16x8_##arch,  /* 16x8 */                       \
201
927k
      cfl_subtract_average_16x32_##arch, /* 16x32 */                      \
202
927k
      cfl_subtract_average_32x16_##arch, /* 32x16 */                      \
203
927k
      NULL,                              /* 32x64 (invalid CFL size) */   \
204
927k
      NULL,                              /* 64x32 (invalid CFL size) */   \
205
927k
      cfl_subtract_average_4x16_##arch,  /* 4x16 (invalid CFL size) */    \
206
927k
      cfl_subtract_average_16x4_##arch,  /* 16x4 (invalid CFL size) */    \
207
927k
      cfl_subtract_average_8x32_##arch,  /* 8x32 (invalid CFL size) */    \
208
927k
      cfl_subtract_average_32x8_##arch,  /* 32x8 (invalid CFL size) */    \
209
927k
      NULL,                              /* 16x64 (invalid CFL size) */   \
210
927k
      NULL,                              /* 64x16 (invalid CFL size) */   \
211
927k
    };                                                                    \
212
927k
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */ \
213
927k
    /* index the function pointer array out of bounds. */                 \
214
927k
    return sub_avg[tx_size % TX_SIZES_ALL];                               \
215
927k
  }
216
217
// For VSX SIMD optimization, the C versions of width == 4 subtract are
218
// faster than the VSX. As such, the VSX code calls the C versions.
219
void cfl_subtract_average_4x4_c(const uint16_t *src, int16_t *dst);
220
void cfl_subtract_average_4x8_c(const uint16_t *src, int16_t *dst);
221
void cfl_subtract_average_4x16_c(const uint16_t *src, int16_t *dst);
222
223
#define CFL_PREDICT_lbd(arch, width, height)                              \
224
  void cfl_predict_lbd_##width##x##height##_##arch(                       \
225
      const int16_t *pred_buf_q3, uint8_t *dst, int dst_stride,           \
226
1.24M
      int alpha_q3) {                                                     \
227
1.24M
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
1.24M
                           height);                                       \
229
1.24M
  }
cfl_predict_lbd_4x4_c
Line
Count
Source
226
434k
      int alpha_q3) {                                                     \
227
434k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
434k
                           height);                                       \
229
434k
  }
cfl_predict_lbd_4x8_c
Line
Count
Source
226
206k
      int alpha_q3) {                                                     \
227
206k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
206k
                           height);                                       \
229
206k
  }
cfl_predict_lbd_4x16_c
Line
Count
Source
226
40.6k
      int alpha_q3) {                                                     \
227
40.6k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
40.6k
                           height);                                       \
229
40.6k
  }
cfl_predict_lbd_8x4_c
Line
Count
Source
226
275k
      int alpha_q3) {                                                     \
227
275k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
275k
                           height);                                       \
229
275k
  }
cfl_predict_lbd_8x8_c
Line
Count
Source
226
135k
      int alpha_q3) {                                                     \
227
135k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
135k
                           height);                                       \
229
135k
  }
cfl_predict_lbd_8x16_c
Line
Count
Source
226
24.2k
      int alpha_q3) {                                                     \
227
24.2k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
24.2k
                           height);                                       \
229
24.2k
  }
Unexecuted instantiation: cfl_predict_lbd_8x32_c
cfl_predict_lbd_16x4_c
Line
Count
Source
226
53.0k
      int alpha_q3) {                                                     \
227
53.0k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
53.0k
                           height);                                       \
229
53.0k
  }
cfl_predict_lbd_16x8_c
Line
Count
Source
226
29.8k
      int alpha_q3) {                                                     \
227
29.8k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
29.8k
                           height);                                       \
229
29.8k
  }
cfl_predict_lbd_16x16_c
Line
Count
Source
226
44.0k
      int alpha_q3) {                                                     \
227
44.0k
    cfl_predict_lbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, width, \
228
44.0k
                           height);                                       \
229
44.0k
  }
Unexecuted instantiation: cfl_predict_lbd_16x32_c
Unexecuted instantiation: cfl_predict_lbd_32x8_c
Unexecuted instantiation: cfl_predict_lbd_32x16_c
Unexecuted instantiation: cfl_predict_lbd_32x32_c
230
231
#if CONFIG_AV1_HIGHBITDEPTH
232
#define CFL_PREDICT_hbd(arch, width, height)                                   \
233
  void cfl_predict_hbd_##width##x##height##_##arch(                            \
234
      const int16_t *pred_buf_q3, uint16_t *dst, int dst_stride, int alpha_q3, \
235
612k
      int bd) {                                                                \
236
612k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
612k
                           height);                                            \
238
612k
  }
cfl_predict_hbd_4x4_c
Line
Count
Source
235
195k
      int bd) {                                                                \
236
195k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
195k
                           height);                                            \
238
195k
  }
cfl_predict_hbd_4x8_c
Line
Count
Source
235
94.9k
      int bd) {                                                                \
236
94.9k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
94.9k
                           height);                                            \
238
94.9k
  }
cfl_predict_hbd_4x16_c
Line
Count
Source
235
24.6k
      int bd) {                                                                \
236
24.6k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
24.6k
                           height);                                            \
238
24.6k
  }
cfl_predict_hbd_8x4_c
Line
Count
Source
235
127k
      int bd) {                                                                \
236
127k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
127k
                           height);                                            \
238
127k
  }
cfl_predict_hbd_8x8_c
Line
Count
Source
235
73.2k
      int bd) {                                                                \
236
73.2k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
73.2k
                           height);                                            \
238
73.2k
  }
cfl_predict_hbd_8x16_c
Line
Count
Source
235
15.6k
      int bd) {                                                                \
236
15.6k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
15.6k
                           height);                                            \
238
15.6k
  }
Unexecuted instantiation: cfl_predict_hbd_8x32_c
cfl_predict_hbd_16x4_c
Line
Count
Source
235
27.8k
      int bd) {                                                                \
236
27.8k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
27.8k
                           height);                                            \
238
27.8k
  }
cfl_predict_hbd_16x8_c
Line
Count
Source
235
19.7k
      int bd) {                                                                \
236
19.7k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
19.7k
                           height);                                            \
238
19.7k
  }
cfl_predict_hbd_16x16_c
Line
Count
Source
235
32.7k
      int bd) {                                                                \
236
32.7k
    cfl_predict_hbd_##arch(pred_buf_q3, dst, dst_stride, alpha_q3, bd, width,  \
237
32.7k
                           height);                                            \
238
32.7k
  }
Unexecuted instantiation: cfl_predict_hbd_16x32_c
Unexecuted instantiation: cfl_predict_hbd_32x8_c
Unexecuted instantiation: cfl_predict_hbd_32x16_c
Unexecuted instantiation: cfl_predict_hbd_32x32_c
239
#endif
240
241
// This wrapper exists because clang format does not like calling macros with
242
// lowercase letters.
243
#define CFL_PREDICT_X(arch, width, height, bd) \
244
  CFL_PREDICT_##bd(arch, width, height)
245
246
#define CFL_PREDICT_FN(arch, bd)                                            \
247
  CFL_PREDICT_X(arch, 4, 4, bd)                                             \
248
  CFL_PREDICT_X(arch, 4, 8, bd)                                             \
249
  CFL_PREDICT_X(arch, 4, 16, bd)                                            \
250
  CFL_PREDICT_X(arch, 8, 4, bd)                                             \
251
  CFL_PREDICT_X(arch, 8, 8, bd)                                             \
252
  CFL_PREDICT_X(arch, 8, 16, bd)                                            \
253
  CFL_PREDICT_X(arch, 8, 32, bd)                                            \
254
  CFL_PREDICT_X(arch, 16, 4, bd)                                            \
255
  CFL_PREDICT_X(arch, 16, 8, bd)                                            \
256
  CFL_PREDICT_X(arch, 16, 16, bd)                                           \
257
  CFL_PREDICT_X(arch, 16, 32, bd)                                           \
258
  CFL_PREDICT_X(arch, 32, 8, bd)                                            \
259
  CFL_PREDICT_X(arch, 32, 16, bd)                                           \
260
  CFL_PREDICT_X(arch, 32, 32, bd)                                           \
261
1.85M
  cfl_predict_##bd##_fn cfl_get_predict_##bd##_fn_##arch(TX_SIZE tx_size) { \
262
1.85M
    static const cfl_predict_##bd##_fn pred[TX_SIZES_ALL] = {               \
263
1.85M
      cfl_predict_##bd##_4x4_##arch,   /* 4x4 */                            \
264
1.85M
      cfl_predict_##bd##_8x8_##arch,   /* 8x8 */                            \
265
1.85M
      cfl_predict_##bd##_16x16_##arch, /* 16x16 */                          \
266
1.85M
      cfl_predict_##bd##_32x32_##arch, /* 32x32 */                          \
267
1.85M
      NULL,                            /* 64x64 (invalid CFL size) */       \
268
1.85M
      cfl_predict_##bd##_4x8_##arch,   /* 4x8 */                            \
269
1.85M
      cfl_predict_##bd##_8x4_##arch,   /* 8x4 */                            \
270
1.85M
      cfl_predict_##bd##_8x16_##arch,  /* 8x16 */                           \
271
1.85M
      cfl_predict_##bd##_16x8_##arch,  /* 16x8 */                           \
272
1.85M
      cfl_predict_##bd##_16x32_##arch, /* 16x32 */                          \
273
1.85M
      cfl_predict_##bd##_32x16_##arch, /* 32x16 */                          \
274
1.85M
      NULL,                            /* 32x64 (invalid CFL size) */       \
275
1.85M
      NULL,                            /* 64x32 (invalid CFL size) */       \
276
1.85M
      cfl_predict_##bd##_4x16_##arch,  /* 4x16  */                          \
277
1.85M
      cfl_predict_##bd##_16x4_##arch,  /* 16x4  */                          \
278
1.85M
      cfl_predict_##bd##_8x32_##arch,  /* 8x32  */                          \
279
1.85M
      cfl_predict_##bd##_32x8_##arch,  /* 32x8  */                          \
280
1.85M
      NULL,                            /* 16x64 (invalid CFL size) */       \
281
1.85M
      NULL,                            /* 64x16 (invalid CFL size) */       \
282
1.85M
    };                                                                      \
283
1.85M
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */   \
284
1.85M
    /* index the function pointer array out of bounds. */                   \
285
1.85M
    return pred[tx_size % TX_SIZES_ALL];                                    \
286
1.85M
  }
cfl_get_predict_lbd_fn_c
Line
Count
Source
261
1.24M
  cfl_predict_##bd##_fn cfl_get_predict_##bd##_fn_##arch(TX_SIZE tx_size) { \
262
1.24M
    static const cfl_predict_##bd##_fn pred[TX_SIZES_ALL] = {               \
263
1.24M
      cfl_predict_##bd##_4x4_##arch,   /* 4x4 */                            \
264
1.24M
      cfl_predict_##bd##_8x8_##arch,   /* 8x8 */                            \
265
1.24M
      cfl_predict_##bd##_16x16_##arch, /* 16x16 */                          \
266
1.24M
      cfl_predict_##bd##_32x32_##arch, /* 32x32 */                          \
267
1.24M
      NULL,                            /* 64x64 (invalid CFL size) */       \
268
1.24M
      cfl_predict_##bd##_4x8_##arch,   /* 4x8 */                            \
269
1.24M
      cfl_predict_##bd##_8x4_##arch,   /* 8x4 */                            \
270
1.24M
      cfl_predict_##bd##_8x16_##arch,  /* 8x16 */                           \
271
1.24M
      cfl_predict_##bd##_16x8_##arch,  /* 16x8 */                           \
272
1.24M
      cfl_predict_##bd##_16x32_##arch, /* 16x32 */                          \
273
1.24M
      cfl_predict_##bd##_32x16_##arch, /* 32x16 */                          \
274
1.24M
      NULL,                            /* 32x64 (invalid CFL size) */       \
275
1.24M
      NULL,                            /* 64x32 (invalid CFL size) */       \
276
1.24M
      cfl_predict_##bd##_4x16_##arch,  /* 4x16  */                          \
277
1.24M
      cfl_predict_##bd##_16x4_##arch,  /* 16x4  */                          \
278
1.24M
      cfl_predict_##bd##_8x32_##arch,  /* 8x32  */                          \
279
1.24M
      cfl_predict_##bd##_32x8_##arch,  /* 32x8  */                          \
280
1.24M
      NULL,                            /* 16x64 (invalid CFL size) */       \
281
1.24M
      NULL,                            /* 64x16 (invalid CFL size) */       \
282
1.24M
    };                                                                      \
283
1.24M
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */   \
284
1.24M
    /* index the function pointer array out of bounds. */                   \
285
1.24M
    return pred[tx_size % TX_SIZES_ALL];                                    \
286
1.24M
  }
cfl_get_predict_hbd_fn_c
Line
Count
Source
261
612k
  cfl_predict_##bd##_fn cfl_get_predict_##bd##_fn_##arch(TX_SIZE tx_size) { \
262
612k
    static const cfl_predict_##bd##_fn pred[TX_SIZES_ALL] = {               \
263
612k
      cfl_predict_##bd##_4x4_##arch,   /* 4x4 */                            \
264
612k
      cfl_predict_##bd##_8x8_##arch,   /* 8x8 */                            \
265
612k
      cfl_predict_##bd##_16x16_##arch, /* 16x16 */                          \
266
612k
      cfl_predict_##bd##_32x32_##arch, /* 32x32 */                          \
267
612k
      NULL,                            /* 64x64 (invalid CFL size) */       \
268
612k
      cfl_predict_##bd##_4x8_##arch,   /* 4x8 */                            \
269
612k
      cfl_predict_##bd##_8x4_##arch,   /* 8x4 */                            \
270
612k
      cfl_predict_##bd##_8x16_##arch,  /* 8x16 */                           \
271
612k
      cfl_predict_##bd##_16x8_##arch,  /* 16x8 */                           \
272
612k
      cfl_predict_##bd##_16x32_##arch, /* 16x32 */                          \
273
612k
      cfl_predict_##bd##_32x16_##arch, /* 32x16 */                          \
274
612k
      NULL,                            /* 32x64 (invalid CFL size) */       \
275
612k
      NULL,                            /* 64x32 (invalid CFL size) */       \
276
612k
      cfl_predict_##bd##_4x16_##arch,  /* 4x16  */                          \
277
612k
      cfl_predict_##bd##_16x4_##arch,  /* 16x4  */                          \
278
612k
      cfl_predict_##bd##_8x32_##arch,  /* 8x32  */                          \
279
612k
      cfl_predict_##bd##_32x8_##arch,  /* 32x8  */                          \
280
612k
      NULL,                            /* 16x64 (invalid CFL size) */       \
281
612k
      NULL,                            /* 64x16 (invalid CFL size) */       \
282
612k
    };                                                                      \
283
612k
    /* Modulo TX_SIZES_ALL to ensure that an attacker won't be able to */   \
284
612k
    /* index the function pointer array out of bounds. */                   \
285
612k
    return pred[tx_size % TX_SIZES_ALL];                                    \
286
612k
  }
287
288
#endif  // AOM_AV1_COMMON_CFL_H_