/src/libjxl/lib/jxl/lehmer_code.h
Line | Count | Source |
1 | | // Copyright (c) the JPEG XL Project Authors. All rights reserved. |
2 | | // |
3 | | // Use of this source code is governed by a BSD-style |
4 | | // license that can be found in the LICENSE file. |
5 | | |
6 | | #ifndef LIB_JXL_LEHMER_CODE_H_ |
7 | | #define LIB_JXL_LEHMER_CODE_H_ |
8 | | |
9 | | #include <stddef.h> |
10 | | #include <stdint.h> |
11 | | |
12 | | #include "lib/jxl/base/bits.h" |
13 | | #include "lib/jxl/base/compiler_specific.h" |
14 | | #include "lib/jxl/base/status.h" |
15 | | |
16 | | namespace jxl { |
17 | | |
18 | | // Permutation <=> factorial base representation (Lehmer code). |
19 | | |
20 | | using LehmerT = uint32_t; |
21 | | |
22 | | template <typename T> |
23 | 2.27M | constexpr T ValueOfLowest1Bit(T t) { |
24 | 2.27M | return t & -t; |
25 | 2.27M | } unsigned int jxl::ValueOfLowest1Bit<unsigned int>(unsigned int) Line | Count | Source | 23 | 1.65M | constexpr T ValueOfLowest1Bit(T t) { | 24 | 1.65M | return t & -t; | 25 | 1.65M | } |
int jxl::ValueOfLowest1Bit<int>(int) Line | Count | Source | 23 | 124k | constexpr T ValueOfLowest1Bit(T t) { | 24 | 124k | return t & -t; | 25 | 124k | } |
unsigned long jxl::ValueOfLowest1Bit<unsigned long>(unsigned long) Line | Count | Source | 23 | 498k | constexpr T ValueOfLowest1Bit(T t) { | 24 | 498k | return t & -t; | 25 | 498k | } |
|
26 | | |
27 | | // Computes the Lehmer (factorial basis) code of permutation, an array of n |
28 | | // unique indices in [0..n), and stores it in code[0..len). N*logN time. |
29 | | // temp must have n + 1 elements but need not be initialized. |
30 | | template <typename PermutationT> |
31 | | Status ComputeLehmerCode(const PermutationT* JXL_RESTRICT permutation, |
32 | | uint32_t* JXL_RESTRICT temp, const size_t n, |
33 | 1.50k | LehmerT* JXL_RESTRICT code) { |
34 | 318k | for (size_t idx = 0; idx < n + 1; ++idx) temp[idx] = 0; |
35 | | |
36 | 316k | for (size_t idx = 0; idx < n; ++idx) { |
37 | 315k | const PermutationT s = permutation[idx]; |
38 | | |
39 | | // Compute sum in Fenwick tree |
40 | 315k | uint32_t penalty = 0; |
41 | 315k | uint32_t i = s + 1; |
42 | 1.65M | while (i != 0) { |
43 | 1.33M | penalty += temp[i]; |
44 | 1.33M | i &= i - 1; // clear lowest bit |
45 | 1.33M | } |
46 | 315k | JXL_ENSURE(s >= penalty); |
47 | 315k | code[idx] = s - penalty; |
48 | 315k | i = s + 1; |
49 | | // Add operation in Fenwick tree |
50 | 1.96M | while (i < n + 1) { |
51 | 1.65M | temp[i] += 1; |
52 | 1.65M | i += ValueOfLowest1Bit(i); |
53 | 1.65M | } |
54 | 315k | } |
55 | 1.50k | return true; |
56 | 1.50k | } |
57 | | |
58 | | // Decodes the Lehmer code in code[0..n) into permutation[0..n). |
59 | | // temp must have 1 << CeilLog2(n) elements but need not be initialized. |
60 | | template <typename PermutationT> |
61 | | Status DecodeLehmerCode(const LehmerT* JXL_RESTRICT code, |
62 | | uint32_t* JXL_RESTRICT temp, size_t n, |
63 | 9.73k | PermutationT* JXL_RESTRICT permutation) { |
64 | 9.73k | JXL_ENSURE(n != 0); |
65 | 9.73k | const size_t log2n = CeilLog2Nonzero(n); |
66 | 9.73k | const size_t padded_n = 1ull << log2n; |
67 | | |
68 | 133k | for (size_t i = 0; i < padded_n; i++) { |
69 | 124k | const int32_t i1 = static_cast<int32_t>(i + 1); |
70 | 124k | temp[i] = static_cast<uint32_t>(ValueOfLowest1Bit(i1)); |
71 | 124k | } |
72 | | |
73 | 125k | for (size_t i = 0; i < n; i++) { |
74 | 115k | JXL_ENSURE(code[i] + i < n); |
75 | 115k | uint32_t rank = code[i] + 1; |
76 | | |
77 | | // Extract i-th unused element via implicit order-statistics tree. |
78 | 115k | size_t bit = padded_n; |
79 | 115k | size_t next = 0; |
80 | 983k | for (size_t b = 0; b <= log2n; b++) { |
81 | 867k | const size_t cand = next + bit; |
82 | 867k | JXL_ENSURE(cand >= 1); |
83 | 867k | bit >>= 1; |
84 | 867k | if (temp[cand - 1] < rank) { |
85 | 369k | next = cand; |
86 | 369k | rank -= temp[cand - 1]; |
87 | 369k | } |
88 | 867k | } |
89 | | |
90 | 115k | permutation[i] = next; |
91 | | |
92 | | // Mark as used |
93 | 115k | next += 1; |
94 | 614k | while (next <= padded_n) { |
95 | 498k | temp[next - 1] -= 1; |
96 | 498k | next += ValueOfLowest1Bit(next); |
97 | 498k | } |
98 | 115k | } |
99 | 9.73k | return true; |
100 | 9.73k | } |
101 | | |
102 | | } // namespace jxl |
103 | | |
104 | | #endif // LIB_JXL_LEHMER_CODE_H_ |