Coverage Report

Created: 2026-06-30 07:53

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/libjxl/lib/jxl/dct_block-inl.h
Line
Count
Source
1
// Copyright (c) the JPEG XL Project Authors. All rights reserved.
2
//
3
// Use of this source code is governed by a BSD-style
4
// license that can be found in the LICENSE file.
5
6
// Adapters for DCT input/output: from/to contiguous blocks or image rows.
7
8
#include "lib/jxl/base/compiler_specific.h"
9
10
#if defined(LIB_JXL_DCT_BLOCK_INL_H_) == defined(HWY_TARGET_TOGGLE)
11
#ifdef LIB_JXL_DCT_BLOCK_INL_H_
12
#undef LIB_JXL_DCT_BLOCK_INL_H_
13
#else
14
#define LIB_JXL_DCT_BLOCK_INL_H_
15
#endif
16
17
#include <cstddef>
18
#include <hwy/highway.h>
19
20
#include "lib/jxl/base/status.h"
21
22
HWY_BEFORE_NAMESPACE();
23
namespace jxl {
24
namespace HWY_NAMESPACE {
25
namespace {
26
27
// These templates are not found via ADL.
28
using hwy::HWY_NAMESPACE::Vec;
29
30
// Block: (x, y) <-> (N * y + x)
31
// Lines: (x, y) <-> (stride * y + x)
32
//
33
// I.e. Block is a specialization of Lines with fixed stride.
34
//
35
// FromXXX should implement Read and Load (Read vector).
36
// ToXXX should implement Write and Store (Write vector).
37
38
template <size_t N>
39
using BlockDesc = HWY_CAPPED(float, N);
40
41
// Here and in the following, the SZ template parameter specifies the number of
42
// values to load/store. Needed because we want to handle 4x4 sub-blocks of
43
// 16x16 blocks.
44
class DCTFrom {
45
 public:
46
80.5M
  DCTFrom(const float* data, size_t stride) : stride_(stride), data_(data) {}
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Line
Count
Source
46
24.3M
  DCTFrom(const float* data, size_t stride) : stride_(stride), data_(data) {}
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Line
Count
Source
46
24.0M
  DCTFrom(const float* data, size_t stride) : stride_(stride), data_(data) {}
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Line
Count
Source
46
32.0M
  DCTFrom(const float* data, size_t stride) : stride_(stride), data_(data) {}
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Line
Count
Source
46
119k
  DCTFrom(const float* data, size_t stride) : stride_(stride), data_(data) {}
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Line
Count
Source
46
3.15k
  DCTFrom(const float* data, size_t stride) : stride_(stride), data_(data) {}
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::DCTFrom(float const*, unsigned long)
47
48
  template <typename D>
49
596M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
596M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
596M
    return LoadU(D(), Address(row, i));
56
596M
  }
dec_group.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
201M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
201M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
201M
    return LoadU(D(), Address(row, i));
56
201M
  }
dec_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
101M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
101M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
101M
    return LoadU(D(), Address(row, i));
56
101M
  }
dec_group.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
264M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
264M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
264M
    return LoadU(D(), Address(row, i));
56
264M
  }
dec_group.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
5.83M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
5.83M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
5.83M
    return LoadU(D(), Address(row, i));
56
5.83M
  }
dec_group.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
2.95M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
2.95M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
2.95M
    return LoadU(D(), Address(row, i));
56
2.95M
  }
dec_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
5.75M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
5.75M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
5.75M
    return LoadU(D(), Address(row, i));
56
5.75M
  }
dec_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
2.90M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
2.90M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
2.90M
    return LoadU(D(), Address(row, i));
56
2.90M
  }
dec_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
25.0k
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
25.0k
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
25.0k
    return LoadU(D(), Address(row, i));
56
25.0k
  }
dec_group.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
7.67M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
7.67M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
7.67M
    return LoadU(D(), Address(row, i));
56
7.67M
  }
dec_group.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
3.85M
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
3.85M
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
3.85M
    return LoadU(D(), Address(row, i));
56
3.85M
  }
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
enc_ac_strategy.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
134k
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
134k
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
134k
    return LoadU(D(), Address(row, i));
56
134k
  }
enc_ac_strategy.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
67.2k
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
67.2k
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
67.2k
    return LoadU(D(), Address(row, i));
56
67.2k
  }
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
enc_chroma_from_luma.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, unsigned long, unsigned long) const
Line
Count
Source
49
25.2k
  HWY_INLINE Vec<D> LoadPart(D /* tag */, const size_t row, size_t i) const {
50
25.2k
    JXL_DASSERT(Lanes(D()) <= stride_);
51
    // Since these functions are used also for DC, no alignment at all is
52
    // guaranteed in the case of floating blocks.
53
    // TODO(veluca): consider using a different class for DC-to-LF and
54
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
55
25.2k
    return LoadU(D(), Address(row, i));
56
25.2k
  }
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) jxl::N_SSE4::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) jxl::N_AVX2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) jxl::N_SSE2::(anonymous namespace)::DCTFrom::LoadPart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, unsigned long, unsigned long) const
57
58
43.9M
  HWY_INLINE float Read(const size_t row, const size_t i) const {
59
43.9M
    return *Address(row, i);
60
43.9M
  }
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Line
Count
Source
58
15.7M
  HWY_INLINE float Read(const size_t row, const size_t i) const {
59
15.7M
    return *Address(row, i);
60
15.7M
  }
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Line
Count
Source
58
11.6M
  HWY_INLINE float Read(const size_t row, const size_t i) const {
59
11.6M
    return *Address(row, i);
60
11.6M
  }
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Line
Count
Source
58
15.2M
  HWY_INLINE float Read(const size_t row, const size_t i) const {
59
15.2M
    return *Address(row, i);
60
15.2M
  }
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Line
Count
Source
58
1.20M
  HWY_INLINE float Read(const size_t row, const size_t i) const {
59
1.20M
    return *Address(row, i);
60
1.20M
  }
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Read(unsigned long, unsigned long) const
61
62
  constexpr HWY_INLINE const float* Address(const size_t row,
63
693M
                                            const size_t i) const {
64
693M
    return data_ + row * stride_ + i;
65
693M
  }
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Line
Count
Source
63
233M
                                            const size_t i) const {
64
233M
    return data_ + row * stride_ + i;
65
233M
  }
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Line
Count
Source
63
140M
                                            const size_t i) const {
64
140M
    return data_ + row * stride_ + i;
65
140M
  }
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Line
Count
Source
63
317M
                                            const size_t i) const {
64
317M
    return data_ + row * stride_ + i;
65
317M
  }
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Line
Count
Source
63
1.49M
                                            const size_t i) const {
64
1.49M
    return data_ + row * stride_ + i;
65
1.49M
  }
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
Line
Count
Source
63
26.2k
                                            const size_t i) const {
64
26.2k
    return data_ + row * stride_ + i;
65
26.2k
  }
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Address(unsigned long, unsigned long) const
66
67
54.2M
  size_t Stride() const { return stride_; }
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Stride() const
Line
Count
Source
67
19.1M
  size_t Stride() const { return stride_; }
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Stride() const
Line
Count
Source
67
9.99M
  size_t Stride() const { return stride_; }
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Stride() const
Line
Count
Source
67
25.0M
  size_t Stride() const { return stride_; }
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Stride() const
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Stride() const
Line
Count
Source
67
35.7k
  size_t Stride() const { return stride_; }
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTFrom::Stride() const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTFrom::Stride() const
68
69
 private:
70
  size_t stride_;
71
  const float* JXL_RESTRICT data_;
72
};
73
74
class DCTTo {
75
 public:
76
80.9M
  DCTTo(float* data, size_t stride) : stride_(stride), data_(data) {}
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Line
Count
Source
76
24.4M
  DCTTo(float* data, size_t stride) : stride_(stride), data_(data) {}
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Line
Count
Source
76
24.2M
  DCTTo(float* data, size_t stride) : stride_(stride), data_(data) {}
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Line
Count
Source
76
32.1M
  DCTTo(float* data, size_t stride) : stride_(stride), data_(data) {}
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Line
Count
Source
76
119k
  DCTTo(float* data, size_t stride) : stride_(stride), data_(data) {}
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Line
Count
Source
76
3.15k
  DCTTo(float* data, size_t stride) : stride_(stride), data_(data) {}
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::DCTTo(float*, unsigned long)
77
78
  template <typename D>
79
  HWY_INLINE void StorePart(D /* tag */, const Vec<D>& v, const size_t row,
80
595M
                            size_t i) const {
81
595M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
595M
    StoreU(v, D(), Address(row, i));
87
595M
  }
dec_group.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
201M
                            size_t i) const {
81
201M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
201M
    StoreU(v, D(), Address(row, i));
87
201M
  }
dec_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
101M
                            size_t i) const {
81
101M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
101M
    StoreU(v, D(), Address(row, i));
87
101M
  }
dec_group.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
263M
                            size_t i) const {
81
263M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
263M
    StoreU(v, D(), Address(row, i));
87
263M
  }
dec_group.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
5.82M
                            size_t i) const {
81
5.82M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
5.82M
    StoreU(v, D(), Address(row, i));
87
5.82M
  }
dec_group.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
2.95M
                            size_t i) const {
81
2.95M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
2.95M
    StoreU(v, D(), Address(row, i));
87
2.95M
  }
dec_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
5.74M
                            size_t i) const {
81
5.74M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
5.74M
    StoreU(v, D(), Address(row, i));
87
5.74M
  }
dec_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
2.90M
                            size_t i) const {
81
2.90M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
2.90M
    StoreU(v, D(), Address(row, i));
87
2.90M
  }
dec_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
25.0k
                            size_t i) const {
81
25.0k
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
25.0k
    StoreU(v, D(), Address(row, i));
87
25.0k
  }
dec_group.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
7.67M
                            size_t i) const {
81
7.67M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
7.67M
    StoreU(v, D(), Address(row, i));
87
7.67M
  }
dec_group.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
3.85M
                            size_t i) const {
81
3.85M
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
3.85M
    StoreU(v, D(), Address(row, i));
87
3.85M
  }
Unexecuted instantiation: enc_group.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
enc_ac_strategy.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
134k
                            size_t i) const {
81
134k
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
134k
    StoreU(v, D(), Address(row, i));
87
134k
  }
enc_ac_strategy.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
67.2k
                            size_t i) const {
81
67.2k
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
67.2k
    StoreU(v, D(), Address(row, i));
87
67.2k
  }
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 4ul, 0> >(hwy::N_SSE4::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 4ul, 0> >(hwy::N_AVX2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
enc_chroma_from_luma.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 8ul, 0> >(hwy::N_AVX2::Simd<float, 8ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 8ul, 0>)())) const&, unsigned long, unsigned long) const
Line
Count
Source
80
25.2k
                            size_t i) const {
81
25.2k
    JXL_DASSERT(Lanes(D()) <= stride_);
82
    // Since these functions are used also for DC, no alignment at all is
83
    // guaranteed in the case of floating blocks.
84
    // TODO(veluca): consider using a different class for DC-to-LF and
85
    // DC-from-LF, or copying DC values to/from a temporary aligned location.
86
25.2k
    StoreU(v, D(), Address(row, i));
87
25.2k
  }
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 4ul, 0> >(hwy::N_SSE2::Simd<float, 4ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 4ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 1ul, 0> >(hwy::N_SSE4::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_SSE4::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE4::Simd<float, 2ul, 0> >(hwy::N_SSE4::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE4::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 1ul, 0> >(hwy::N_AVX2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_AVX2::(anonymous namespace)::DCTTo::StorePart<hwy::N_AVX2::Simd<float, 2ul, 0> >(hwy::N_AVX2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_AVX2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 1ul, 0> >(hwy::N_SSE2::Simd<float, 1ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 1ul, 0>)())) const&, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:void jxl::N_SSE2::(anonymous namespace)::DCTTo::StorePart<hwy::N_SSE2::Simd<float, 2ul, 0> >(hwy::N_SSE2::Simd<float, 2ul, 0>, decltype (Zero((hwy::N_SSE2::Simd<float, 2ul, 0>)())) const&, unsigned long, unsigned long) const
88
89
43.9M
  HWY_INLINE void Write(float v, const size_t row, const size_t i) const {
90
43.9M
    *Address(row, i) = v;
91
43.9M
  }
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Line
Count
Source
89
15.7M
  HWY_INLINE void Write(float v, const size_t row, const size_t i) const {
90
15.7M
    *Address(row, i) = v;
91
15.7M
  }
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Line
Count
Source
89
11.6M
  HWY_INLINE void Write(float v, const size_t row, const size_t i) const {
90
11.6M
    *Address(row, i) = v;
91
11.6M
  }
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Line
Count
Source
89
15.2M
  HWY_INLINE void Write(float v, const size_t row, const size_t i) const {
90
15.2M
    *Address(row, i) = v;
91
15.2M
  }
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Line
Count
Source
89
1.20M
  HWY_INLINE void Write(float v, const size_t row, const size_t i) const {
90
1.20M
    *Address(row, i) = v;
91
1.20M
  }
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Write(float, unsigned long, unsigned long) const
92
93
693M
  constexpr HWY_INLINE float* Address(const size_t row, const size_t i) const {
94
693M
    return data_ + row * stride_ + i;
95
693M
  }
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Line
Count
Source
93
233M
  constexpr HWY_INLINE float* Address(const size_t row, const size_t i) const {
94
233M
    return data_ + row * stride_ + i;
95
233M
  }
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Line
Count
Source
93
141M
  constexpr HWY_INLINE float* Address(const size_t row, const size_t i) const {
94
141M
    return data_ + row * stride_ + i;
95
141M
  }
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Line
Count
Source
93
317M
  constexpr HWY_INLINE float* Address(const size_t row, const size_t i) const {
94
317M
    return data_ + row * stride_ + i;
95
317M
  }
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Line
Count
Source
93
1.49M
  constexpr HWY_INLINE float* Address(const size_t row, const size_t i) const {
94
1.49M
    return data_ + row * stride_ + i;
95
1.49M
  }
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
Line
Count
Source
93
26.2k
  constexpr HWY_INLINE float* Address(const size_t row, const size_t i) const {
94
26.2k
    return data_ + row * stride_ + i;
95
26.2k
  }
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Address(unsigned long, unsigned long) const
96
97
54.2M
  size_t Stride() const { return stride_; }
dec_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Stride() const
Line
Count
Source
97
19.1M
  size_t Stride() const { return stride_; }
dec_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Stride() const
Line
Count
Source
97
9.99M
  size_t Stride() const { return stride_; }
dec_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Stride() const
Line
Count
Source
97
25.0M
  size_t Stride() const { return stride_; }
Unexecuted instantiation: enc_group.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_group.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_group.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Stride() const
enc_ac_strategy.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Stride() const
Line
Count
Source
97
35.7k
  size_t Stride() const { return stride_; }
Unexecuted instantiation: enc_ac_strategy.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_adaptive_quantization.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE4::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_AVX2::(anonymous namespace)::DCTTo::Stride() const
Unexecuted instantiation: enc_chroma_from_luma.cc:jxl::N_SSE2::(anonymous namespace)::DCTTo::Stride() const
98
99
 private:
100
  size_t stride_;
101
  float* JXL_RESTRICT data_;
102
};
103
104
}  // namespace
105
// NOLINTNEXTLINE(google-readability-namespace-comments)
106
}  // namespace HWY_NAMESPACE
107
}  // namespace jxl
108
HWY_AFTER_NAMESPACE();
109
110
#endif  // LIB_JXL_DCT_BLOCK_INL_H_