Coverage Report

Created: 2026-06-10 07:00

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/work/vvenc/source/Lib/CommonLib/Quant.cpp
Line
Count
Source
1
/* -----------------------------------------------------------------------------
2
The copyright in this software is being made available under the Clear BSD
3
License, included below. No patent rights, trademark rights and/or 
4
other Intellectual Property Rights other than the copyrights concerning 
5
the Software are granted under this license.
6
7
The Clear BSD License
8
9
Copyright (c) 2019-2026, Fraunhofer-Gesellschaft zur Förderung der angewandten Forschung e.V. & The VVenC Authors.
10
All rights reserved.
11
12
Redistribution and use in source and binary forms, with or without modification,
13
are permitted (subject to the limitations in the disclaimer below) provided that
14
the following conditions are met:
15
16
     * Redistributions of source code must retain the above copyright notice,
17
     this list of conditions and the following disclaimer.
18
19
     * Redistributions in binary form must reproduce the above copyright
20
     notice, this list of conditions and the following disclaimer in the
21
     documentation and/or other materials provided with the distribution.
22
23
     * Neither the name of the copyright holder nor the names of its
24
     contributors may be used to endorse or promote products derived from this
25
     software without specific prior written permission.
26
27
NO EXPRESS OR IMPLIED LICENSES TO ANY PARTY'S PATENT RIGHTS ARE GRANTED BY
28
THIS LICENSE. THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND
29
CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
30
LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A
31
PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR
32
CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
33
EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
34
PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
35
BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER
36
IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
37
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
38
POSSIBILITY OF SUCH DAMAGE.
39
40
41
------------------------------------------------------------------------------------------- */
42
43
44
/** \file     Quant.cpp
45
    \brief    transform and quantization class
46
*/
47
48
#include "Quant.h"
49
#include "UnitTools.h"
50
#include "ContextModelling.h"
51
#include "CodingStructure.h"
52
#include "dtrace_buffer.h"
53
54
#include <stdlib.h>
55
#include <memory.h>
56
57
//! \ingroup CommonLib
58
//! \{
59
60
namespace vvenc {
61
62
// ====================================================================================================================
63
// Constants
64
// ====================================================================================================================
65
66
67
// ====================================================================================================================
68
// QpParam constructor
69
// ====================================================================================================================
70
 
71
QpParam::QpParam(const TransformUnit& tu, const ComponentID &compID, const bool allowACTQpoffset)
72
5.81M
{
73
5.81M
  const ChannelType chType = toChannelType( compID );
74
5.81M
  const SPS        &sps    = *tu.cu->cs->sps;
75
5.81M
  const int     qpBdOffset = sps.qpBDOffset[chType];
76
5.81M
  const bool useJQP        = isChroma( compID ) && abs( TU::getICTMode( tu ) ) == 2;
77
5.81M
  const ComponentID jCbCr  = useJQP ? COMP_JOINT_CbCr : compID;
78
  
79
5.81M
        int chromaQpOffset = 0;
80
81
5.81M
  if( isChroma( compID ) )
82
5.61M
  {
83
5.61M
    const PPS &pps  = *tu.cu->slice->pps;
84
5.61M
    chromaQpOffset  = pps.chromaQpOffset              [jCbCr];
85
5.61M
    chromaQpOffset += tu.cu->slice->sliceChromaQpDelta[jCbCr];
86
5.61M
    chromaQpOffset += pps.getChromaQpOffsetListEntry( tu.cu->chromaQpAdj ).u.offset[int( jCbCr ) - 1];
87
5.61M
  }
88
  
89
5.81M
  int baseQp;
90
5.81M
  int qpy        = tu.cu->qp;
91
  //bool skip      = tu.mtsIdx[compID] == MTS_SKIP;
92
93
5.81M
  if( isLuma( compID ) )
94
200k
  {
95
200k
    baseQp = tu.cu->qp + qpBdOffset;
96
200k
  }
97
5.61M
  else
98
5.61M
  {
99
5.61M
    int qpi = Clip3( -qpBdOffset, MAX_QP, qpy );
100
5.61M
    baseQp  = sps.chromaQpMappingTable.getMappedChromaQpValue( jCbCr, qpi );
101
5.61M
    baseQp  = Clip3( -qpBdOffset, MAX_QP, baseQp + chromaQpOffset ) + qpBdOffset;
102
5.61M
  }
103
104
5.81M
  if( allowACTQpoffset && tu.cu->colorTransform )
105
0
  {
106
0
    baseQp += DELTA_QP_ACT[jCbCr];
107
0
  }
108
109
5.81M
  baseQp = Clip3( 0, MAX_QP + qpBdOffset, baseQp );
110
111
  //if( !skip )
112
5.81M
  {
113
5.81M
    Qps [0] = baseQp;
114
5.81M
    pers[0] = baseQp / 6;
115
5.81M
    rems[0] = baseQp % 6;
116
5.81M
  }
117
  //else
118
5.81M
  {
119
5.81M
    int internalMinusInputBitDepth = sps.internalMinusInputBitDepth[chType];
120
5.81M
    int baseQpTS           = std::max( baseQp, 4 + 6 * internalMinusInputBitDepth );
121
122
5.81M
    Qps [1] = baseQpTS;
123
5.81M
    pers[1] = baseQpTS / 6;
124
5.81M
    rems[1] = baseQpTS % 6;
125
5.81M
  }
126
5.81M
}
127
128
129
// ====================================================================================================================
130
// Quant class member functions
131
// ====================================================================================================================
132
static void QuantCore(const TransformUnit tu, const ComponentID compID, const CCoeffBuf& piCoef,CoeffSigBuf piQCoef,TCoeff &uiAbsSum, int &lastScanPos,TCoeff *deltaU,const int defaultQuantisationCoefficient,const int iQBits,const int64_t iAdd,const TCoeff entropyCodingMinimum,const TCoeff entropyCodingMaximum,const bool signHiding, const TCoeff m_thrVal)
133
5.24k
{
134
5.24k
  CoeffCodingContext cctx( tu, compID, signHiding );
135
136
5.24k
  const CompArea &rect      = tu.blocks[compID];
137
5.24k
  const uint32_t uiWidth    = rect.width;
138
5.24k
  const uint32_t uiHeight   = rect.height;
139
140
  /* for 422 chroma blocks, the effective scaling applied during transformation is not a power of 2, hence it cannot be
141
  * implemented as a bit-shift (the quantised result will be sqrt(2) * larger than required). Alternatively, adjust the
142
  * uiLog2TrSize applied in iTransformShift, such that the result is 1/sqrt(2) the required result (i.e. smaller)
143
  * Then a QP+3 (sqrt(2)) or QP-3 (1/sqrt(2)) method could be used to get the required result
144
  */
145
146
5.24k
  const uint32_t log2CGSize         = cctx.log2CGSize();
147
148
5.24k
  uiAbsSum = 0;
149
150
5.24k
  const int iCGSize   = 1 << log2CGSize;
151
152
5.24k
  const uint32_t lfnstIdx = tu.cu->lfnstIdx;
153
5.24k
  const int iCGNum   = lfnstIdx > 0 ? 1 : std::min<int>(JVET_C0024_ZERO_OUT_TH, uiWidth) * std::min<int>(JVET_C0024_ZERO_OUT_TH, uiHeight) >> cctx.log2CGSize();
154
5.24k
  int       iScanPos = ( iCGNum << log2CGSize ) - 1;
155
156
5.24k
  if( lfnstIdx > 0 && ( ( uiWidth == 4 && uiHeight == 4 ) || ( uiWidth == 8 && uiHeight == 8 ) ) )
157
0
  {
158
0
    iScanPos = 7;
159
0
  }
160
161
  // Find first non-zero coeff
162
29.6k
  for( ; iScanPos > 0; iScanPos-- )
163
28.3k
  {
164
28.3k
    uint32_t uiBlkPos = cctx.blockPos( iScanPos );
165
28.3k
    if( piCoef.buf[uiBlkPos] )
166
3.92k
      break;
167
28.3k
  }
168
169
  //////////////////////////////////////////////////////////////////////////
170
  //  Loop over sub-sets (coefficient groups)
171
  //////////////////////////////////////////////////////////////////////////
172
  
173
5.24k
  TCoeff thres = 0, useThres = 0;
174
  
175
5.24k
  if( iQBits )
176
5.24k
    thres = TCoeff( ( int64_t( m_thrVal ) << ( iQBits - 1 ) ) );
177
0
  else
178
0
    thres = TCoeff( ( int64_t( m_thrVal >> 1 ) << iQBits ) );
179
180
5.24k
  useThres = thres / ( defaultQuantisationCoefficient << 2 );
181
182
5.24k
  const bool is4x4sbb = log2CGSize == 4 && cctx.log2CGWidth() == 2;
183
184
5.24k
  int subSetId = iScanPos >> log2CGSize;
185
6.04k
  for( ; subSetId >= 1; subSetId-- )
186
803
  {
187
803
    if( is4x4sbb && iScanPos >= 16 )
188
0
    {
189
0
      int  iScanPosinCG = iScanPos & ( iCGSize - 1 );
190
0
      bool allSmaller   = true;
191
192
0
      for( int xScanPosinCG = iScanPosinCG, xScanPos = iScanPos; allSmaller && xScanPosinCG >= 0; xScanPosinCG--, xScanPos-- )
193
0
      {
194
0
        const uint32_t uiBlkPos = cctx.blockPos( xScanPos );
195
0
        allSmaller &= abs( piCoef.buf[uiBlkPos] ) <= useThres;
196
0
      }
197
198
0
      if( allSmaller )
199
0
      {
200
0
        iScanPos    -= iScanPosinCG + 1;
201
0
        continue;
202
0
      }
203
0
      else
204
0
      {
205
0
        break;
206
0
      }
207
0
    }
208
803
  }
209
210
5.24k
  const int qBits8 = iQBits - 8;
211
5.24k
  piQCoef.memset( 0 );
212
213
82.1k
  for( int currPos = 0; currPos <= iScanPos; currPos++ )
214
76.9k
  {
215
76.9k
    const int uiBlockPos  = cctx.blockPos( currPos );
216
76.9k
    const TCoeff iLevel   = piCoef.buf[uiBlockPos];
217
76.9k
    const TCoeff iSign    = (iLevel < 0 ? -1: 1);
218
219
76.9k
    const int64_t  tmpLevel = (int64_t)abs(iLevel) * defaultQuantisationCoefficient;
220
76.9k
    const TCoeff quantisedMagnitude = TCoeff((tmpLevel + iAdd ) >> iQBits);
221
76.9k
    deltaU[uiBlockPos] = (TCoeff)((tmpLevel - ((int64_t)quantisedMagnitude<<iQBits) )>> qBits8);
222
223
76.9k
    uiAbsSum += quantisedMagnitude;
224
76.9k
    const TCoeff quantisedCoefficient = quantisedMagnitude * iSign;
225
226
76.9k
    piQCoef.buf[uiBlockPos] = Clip3<TCoeff>( entropyCodingMinimum, entropyCodingMaximum, quantisedCoefficient );
227
76.9k
  } // for n
228
229
5.24k
  lastScanPos = iScanPos;
230
5.24k
}
231
232
static void DeQuantCore(const int maxX,const int maxY,const int scale,const TCoeffSig* const piQCoef,const size_t piQCfStride,TCoeff   *const piCoef,const int rightShift,const int inputMaximum,const TCoeff transformMaximum)
233
44.3k
{
234
44.3k
  const int inputMinimum = -(inputMaximum+1);
235
44.3k
  const TCoeff transformMinimum = -(transformMaximum+1);
236
44.3k
  if (rightShift>0)
237
34.8k
  {
238
34.8k
    const Intermediate_Int iAdd = (Intermediate_Int) 1 << (rightShift - 1);
239
330k
    for( int y = 0, n = 0; y <= maxY; y++)
240
296k
    {
241
3.17M
      for( int x = 0; x <= maxX; x++, n++ )
242
2.87M
      {
243
2.87M
        const TCoeff           clipQCoef = TCoeff(Clip3<Intermediate_Int>(inputMinimum, inputMaximum, piQCoef[x + y * piQCfStride]));
244
2.87M
        Intermediate_Int iCoeffQ   = (Intermediate_Int(clipQCoef) * scale + iAdd) >> rightShift;
245
2.87M
        piCoef[n] = TCoeff(Clip3<Intermediate_Int>(transformMinimum,transformMaximum,iCoeffQ));
246
2.87M
      }
247
296k
    }
248
34.8k
  }
249
9.48k
  else  // rightshift <0
250
9.48k
  {
251
9.48k
    int leftShift = -rightShift;
252
113k
    for( int y = 0, n = 0; y <= maxY; y++)
253
103k
    {
254
1.24M
      for( int x = 0; x <= maxX; x++, n++ )
255
1.14M
      {
256
1.14M
        const TCoeff           clipQCoef = TCoeff(Clip3<Intermediate_Int>(inputMinimum, inputMaximum, piQCoef[x + y * piQCfStride]));
257
1.14M
        const Intermediate_Int iCoeffQ   = (Intermediate_Int(clipQCoef) * scale) * (1 << leftShift);
258
1.14M
        piCoef[n] = TCoeff(Clip3<Intermediate_Int>(transformMinimum,transformMaximum,iCoeffQ));
259
1.14M
      }
260
103k
    }
261
9.48k
  }
262
44.3k
}
263
264
static bool needRdoqCore( const TCoeff* pCoeff, size_t numCoeff, int quantCoeff, int64_t offset, int shift )
265
0
{
266
0
  for( int uiBlockPos = 0; uiBlockPos < numCoeff; uiBlockPos++ )
267
0
  {
268
0
    const TCoeff   iLevel = pCoeff[uiBlockPos];
269
0
    const int64_t  tmpLevel = ( int64_t ) std::abs( iLevel ) * quantCoeff;
270
0
    const TCoeff quantisedMagnitude = TCoeff( ( tmpLevel + offset ) >> shift );
271
272
0
    if( quantisedMagnitude != 0 )
273
0
    {
274
0
      return true;
275
0
    }
276
0
  } // for n
277
0
  return false;
278
0
}
279
280
281
17.7k
Quant::Quant( const Quant* other, bool useScalingLists ) : m_RDOQ( 0 ), m_useRDOQTS( false ), m_dLambda( 0.0 )
282
17.7k
{
283
17.7k
  xInitScalingList( other, useScalingLists );
284
17.7k
  xDeQuant  = DeQuantCore;
285
17.7k
  xQuant    = QuantCore;
286
17.7k
  xNeedRdoq = needRdoqCore;
287
#if defined( TARGET_SIMD_X86 ) && ENABLE_SIMD_OPT_QUANT
288
  initQuantX86();
289
#endif
290
291
17.7k
}
292
293
Quant::~Quant()
294
17.7k
{
295
17.7k
  xDestroyScalingList();
296
17.7k
}
297
298
void invResDPCM( const TransformUnit& tu, const ComponentID compID, CoeffSigBuf& dstBuf )
299
44.3k
{
300
44.3k
  const CompArea&    rect   = tu.blocks[compID];
301
44.3k
  const int          wdt    = rect.width;
302
44.3k
  const int          hgt    = rect.height;
303
44.3k
  const CCoeffSigBuf coeffs = tu.getCoeffs(compID);
304
305
44.3k
  const int      maxLog2TrDynamicRange = tu.cs->sps->getMaxLog2TrDynamicRange();
306
44.3k
  const TCoeff   inputMinimum          = -(1 << maxLog2TrDynamicRange);
307
44.3k
  const TCoeff   inputMaximum          =  (1 << maxLog2TrDynamicRange) - 1;
308
309
44.3k
  const TCoeffSig* coef = &coeffs.buf[0];
310
44.3k
        TCoeffSig* dst  = &dstBuf.buf[0];
311
312
44.3k
  if ( tu.cu->bdpcmM[toChannelType(compID)] == 1)
313
500
  {
314
7.16k
    for( int y = 0; y < hgt; y++ )
315
6.66k
    {
316
6.66k
      dst[0] = coef[0];
317
106k
      for( int x = 1; x < wdt; x++ )
318
100k
      {
319
100k
        dst[x] = Clip3(inputMinimum, inputMaximum, TCoeff( dst[x - 1] ) + TCoeff( coef[x] ));
320
100k
      }
321
6.66k
      coef += coeffs.stride;
322
6.66k
      dst += dstBuf.stride;
323
6.66k
    }
324
500
  }
325
43.8k
  else
326
43.8k
  {
327
462k
    for( int x = 0; x < wdt; x++ )
328
418k
    {
329
418k
      dst[x] = coef[x];
330
418k
    }
331
393k
    for( int y = 0; y < hgt - 1; y++ )
332
349k
    {
333
3.84M
      for( int x = 0; x < wdt; x++ )
334
3.49M
      {
335
3.49M
        dst[dstBuf.stride + x] = Clip3(inputMinimum, inputMaximum, TCoeff( dst[x] ) + TCoeff( coef[coeffs.stride + x] ));
336
3.49M
      }
337
349k
      coef += coeffs.stride;
338
349k
      dst += dstBuf.stride;
339
349k
    }
340
43.8k
  }
341
44.3k
}
342
343
void fwdResDPCM( TransformUnit& tu, const ComponentID compID )
344
5.24k
{
345
5.24k
  const CompArea& rect   = tu.blocks[compID];
346
5.24k
  const int       wdt    = rect.width;
347
5.24k
  const int       hgt    = rect.height;
348
5.24k
  CoeffSigBuf     coeffs = tu.getCoeffs(compID);
349
350
5.24k
  TCoeffSig* coef = &coeffs.buf[0];
351
5.24k
  if (tu.cu->bdpcmM[toChannelType(compID)] == 1)
352
0
  {
353
0
    for( int y = 0; y < hgt; y++ )
354
0
    {
355
0
      for( int x = wdt - 1; x > 0; x-- )
356
0
      {
357
0
        coef[x] -= coef[x - 1];
358
0
      }
359
0
      coef += coeffs.stride;
360
0
    }
361
0
  }
362
5.24k
  else
363
5.24k
  {
364
5.24k
    coef += coeffs.stride * (hgt - 1);
365
10.4k
    for( int y = 0; y < hgt - 1; y++ )
366
5.24k
    {
367
55.9k
      for ( int x = 0; x < wdt; x++ )
368
50.6k
      {
369
50.6k
        coef[x] -= coef[x - coeffs.stride];
370
50.6k
      }
371
5.24k
      coef -= coeffs.stride;
372
5.24k
    }
373
5.24k
  }
374
5.24k
}
375
376
// To minimize the distortion only. No rate is considered.
377
void Quant::xSignBitHidingHDQ( TCoeffSig* pQCoef, const TCoeff* pCoef, TCoeff* deltaU, const CoeffCodingContext& cctx, int& lastScanPos, const int maxLog2TrDynamicRange )
378
0
{
379
0
  const uint32_t groupSize = 1 << cctx.log2CGSize();
380
381
0
  const TCoeff entropyCodingMinimum = -(1 << maxLog2TrDynamicRange);
382
0
  const TCoeff entropyCodingMaximum =  (1 << maxLog2TrDynamicRange) - 1;
383
384
0
  int lastCG = -1;
385
0
  int absSum = 0 ;
386
0
  int n ;
387
388
0
  for( int subSet = lastScanPos >> cctx.log2CGSize(); subSet >= 0; subSet-- )
389
0
  {
390
0
    int  subPos = subSet << cctx.log2CGSize();
391
0
    int  firstNZPosInCG=groupSize , lastNZPosInCG=-1 ;
392
0
    absSum = 0 ;
393
394
0
    for(n = groupSize-1; n >= 0; --n )
395
0
    {
396
0
      if( pQCoef[ cctx.blockPos( n + subPos ) ] )
397
0
      {
398
0
        lastNZPosInCG = n;
399
0
        break;
400
0
      }
401
0
    }
402
403
0
    for(n = 0; n <groupSize; n++ )
404
0
    {
405
0
      if( pQCoef[ cctx.blockPos( n + subPos ) ] )
406
0
      {
407
0
        firstNZPosInCG = n;
408
0
        break;
409
0
      }
410
0
    }
411
412
0
    for(n = firstNZPosInCG; n <=lastNZPosInCG; n++ )
413
0
    {
414
0
      absSum += int(pQCoef[ cctx.blockPos( n + subPos ) ]);
415
0
    }
416
417
0
    if(lastNZPosInCG>=0 && lastCG==-1)
418
0
    {
419
0
      lastCG = 1 ;
420
0
    }
421
422
0
    if( lastNZPosInCG-firstNZPosInCG>=SBH_THRESHOLD )
423
0
    {
424
0
      uint32_t signbit = (pQCoef[cctx.blockPos(subPos+firstNZPosInCG)]>0?0:1) ;
425
0
      if( signbit!=(absSum&0x1) )  //compare signbit with sum_parity
426
0
      {
427
0
        TCoeff curCost    = std::numeric_limits<TCoeff>::max();
428
0
        TCoeff minCostInc = std::numeric_limits<TCoeff>::max();
429
0
        int minPos =-1, finalChange=0, curChange=0, minScanPos = -1;
430
431
0
        for( n = (lastCG==1?lastNZPosInCG:groupSize-1) ; n >= 0; --n )
432
0
        {
433
0
          uint32_t blkPos   = cctx.blockPos( n+subPos );
434
0
          if(pQCoef[ blkPos ] != 0 )
435
0
          {
436
0
            if(deltaU[blkPos]>0)
437
0
            {
438
0
              curCost = - deltaU[blkPos];
439
0
              curChange=1 ;
440
0
            }
441
0
            else
442
0
            {
443
              //curChange =-1;
444
0
              if(n==firstNZPosInCG && abs(pQCoef[blkPos])==1)
445
0
              {
446
0
                curCost = std::numeric_limits<TCoeff>::max();
447
0
              }
448
0
              else
449
0
              {
450
0
                curCost = deltaU[blkPos];
451
0
                curChange =-1;
452
0
              }
453
0
            }
454
0
          }
455
0
          else
456
0
          {
457
0
            if(n<firstNZPosInCG)
458
0
            {
459
0
              uint32_t thisSignBit = (pCoef[blkPos]>=0?0:1);
460
0
              if(thisSignBit != signbit )
461
0
              {
462
0
                curCost = std::numeric_limits<TCoeff>::max();
463
0
              }
464
0
              else
465
0
              {
466
0
                curCost = - (deltaU[blkPos])  ;
467
0
                curChange = 1 ;
468
0
              }
469
0
            }
470
0
            else
471
0
            {
472
0
              curCost = - (deltaU[blkPos])  ;
473
0
              curChange = 1 ;
474
0
            }
475
0
          }
476
477
0
          if( curCost<minCostInc)
478
0
          {
479
0
            minCostInc = curCost ;
480
0
            finalChange = curChange ;
481
0
            minPos = blkPos;
482
0
            minScanPos = n + subPos;
483
0
          }
484
0
        } //CG loop
485
486
0
        if(pQCoef[minPos] == entropyCodingMaximum || pQCoef[minPos] == entropyCodingMinimum)
487
0
        {
488
0
          finalChange = -1;
489
0
        }
490
491
0
        if(pCoef[minPos]>=0)
492
0
        {
493
0
          pQCoef[minPos] += finalChange ;
494
0
        }
495
0
        else
496
0
        {
497
0
          pQCoef[minPos] -= finalChange ;
498
0
        }
499
500
        // if changing lastScanPos element to 0, move the pointer to the new lastScanPos element
501
0
        if( minScanPos == lastScanPos && pQCoef[minPos] == 0 )
502
0
        {
503
0
          for( ; lastScanPos >= 0 && pQCoef[cctx.blockPos( lastScanPos )] == 0; lastScanPos-- );
504
0
        }
505
0
        else if( minScanPos > lastScanPos && pQCoef[minPos] != 0 )
506
0
        {
507
0
          lastScanPos = minPos;
508
0
        }
509
0
      } // Hide
510
0
    }
511
0
    if(lastCG==1)
512
0
    {
513
0
      lastCG=0 ;
514
0
    }
515
0
  } // TU loop
516
517
0
  return;
518
0
}
519
520
void Quant::dequant(const TransformUnit& tu,
521
                          CoeffBuf&      dstCoeff,
522
                    const ComponentID    compID,
523
                    const QpParam&       cQP)
524
44.3k
{
525
44.3k
  const SPS       *sps                  = tu.cs->sps;
526
44.3k
  const CompArea  &area                 = tu.blocks[compID];
527
44.3k
  const uint32_t  uiWidth               = area.width;
528
44.3k
  const uint32_t  uiHeight              = area.height;
529
44.3k
  TCoeff *const   piCoef                = dstCoeff.buf;
530
44.3k
  const uint32_t  numSamplesInBlock     = uiWidth * uiHeight;
531
44.3k
  const int       maxLog2TrDynamicRange = sps->getMaxLog2TrDynamicRange();
532
44.3k
  const TCoeff    transformMinimum      = -(1 << maxLog2TrDynamicRange);
533
44.3k
  const TCoeff    transformMaximum      =  (1 << maxLog2TrDynamicRange) - 1;
534
44.3k
  const bool      isTransformSkip       = tu.mtsIdx[compID] == MTS_SKIP;
535
44.3k
  const bool      isLfnstApplied        = tu.cu->lfnstIdx > 0 && (CU::isSepTree(*tu.cu) ? true : isLuma(compID));
536
44.3k
  const bool      enableScalingLists    = getUseScalingList(uiWidth, uiHeight, isTransformSkip, isLfnstApplied);
537
44.3k
  const int       scalingListType       = getScalingListType(tu.cu->predMode, compID);
538
44.3k
  const int       channelBitDepth       = sps->bitDepths[toChannelType(compID)];
539
540
44.3k
  const TCoeffSig *coef     = tu.getCoeffs( compID ).buf;
541
44.3k
  const ptrdiff_t  piStride = tu.getCoeffs( compID ).stride;
542
543
44.3k
  if( tu.cu->bdpcmM[toChannelType( compID )] )
544
44.3k
  {
545
44.3k
    CoeffSigBuf coefBuf( m_tmpBdpcm, uiWidth, uiHeight );
546
44.3k
    invResDPCM( tu, compID, coefBuf );
547
44.3k
    coef      = m_tmpBdpcm;
548
44.3k
  }
549
550
44.3k
  const TCoeffSig  *const piQCoef = coef;
551
44.3k
  CHECK(scalingListType >= SCALING_LIST_NUM, "Invalid scaling list");
552
553
  // Represents scaling through forward transform
554
44.3k
  const int  originalTransformShift = getTransformShift(channelBitDepth, area.size(), maxLog2TrDynamicRange);
555
44.3k
  const bool needSqrtAdjustment     = TU::needsSqrt2Scale( tu, compID );
556
44.3k
  const int  iTransformShift        = originalTransformShift + (needSqrtAdjustment?-1:0);
557
558
44.3k
  const int QP_per = cQP.per(isTransformSkip);
559
44.3k
  const int QP_rem = cQP.rem(isTransformSkip);
560
561
44.3k
  const int  rightShift = (IQUANT_SHIFT - ((isTransformSkip ? 0 : iTransformShift) + QP_per)) + (enableScalingLists ? LOG2_SCALING_LIST_NEUTRAL_VALUE : 0);
562
563
44.3k
  if(enableScalingLists)
564
0
  {
565
    //from the dequantization equation:
566
    //iCoeffQ                         = ((Intermediate_Int(clipQCoef) * piDequantCoef[deQuantIdx]) + iAdd ) >> rightShift
567
    //(sizeof(Intermediate_Int) * 8)  =              inputBitDepth    +    dequantCoefBits                   - rightShift
568
0
    const uint32_t             dequantCoefBits     = 1 + IQUANT_SHIFT + SCALING_LIST_BITS;
569
0
    const uint32_t             targetInputBitDepth = std::min<uint32_t>((maxLog2TrDynamicRange + 1), (((sizeof(Intermediate_Int) * 8) + rightShift) - dequantCoefBits));
570
571
0
    const Intermediate_Int inputMinimum        = -(1 << (targetInputBitDepth - 1));
572
0
    const Intermediate_Int inputMaximum        =  (1 << (targetInputBitDepth - 1)) - 1;
573
574
0
    const uint32_t uiLog2TrWidth  = Log2(uiWidth);
575
0
    const uint32_t uiLog2TrHeight = Log2(uiHeight);
576
0
    int* piDequantCoef            = getDequantCoeff(scalingListType, QP_rem, uiLog2TrWidth, uiLog2TrHeight);
577
578
0
    if(rightShift > 0)
579
0
    {
580
0
      const Intermediate_Int iAdd = (Intermediate_Int) 1 << (rightShift - 1);
581
0
      for( int n = 0; n < numSamplesInBlock; n++ )
582
0
      {
583
0
        const TCoeff           clipQCoef = TCoeff(Clip3<Intermediate_Int>(inputMinimum, inputMaximum, piQCoef[n]));
584
0
        const Intermediate_Int iCoeffQ   = ((Intermediate_Int(clipQCoef) * piDequantCoef[n]) + iAdd ) >> rightShift;
585
0
        piCoef[n] = TCoeff(Clip3<Intermediate_Int>(transformMinimum,transformMaximum,iCoeffQ));
586
0
      }
587
0
    }
588
0
    else
589
0
    {
590
0
      const int leftShift = -rightShift;
591
0
      for( int n = 0; n < numSamplesInBlock; n++ )
592
0
      {
593
0
        const TCoeff           clipQCoef = TCoeff(Clip3<Intermediate_Int>(inputMinimum, inputMaximum, piQCoef[n]));
594
0
        const Intermediate_Int iCoeffQ   = (Intermediate_Int(clipQCoef) * piDequantCoef[n]) << leftShift;
595
0
        piCoef[n] = TCoeff(Clip3<Intermediate_Int>(transformMinimum,transformMaximum,iCoeffQ));
596
0
      }
597
0
    }
598
0
  }
599
44.3k
  else
600
44.3k
  {
601
44.3k
    const int scale     = g_invQuantScales[needSqrtAdjustment?1:0][QP_rem];
602
44.3k
    const int scaleBits = ( IQUANT_SHIFT + 1 );
603
    //from the dequantisation equation:
604
    //iCoeffQ                         = Intermediate_Int((int64_t(clipQCoef) * scale + iAdd) >> rightShift);
605
    //(sizeof(Intermediate_Int) * 8)  =                    inputBitDepth   + scaleBits      - rightShift
606
44.3k
    const uint32_t             targetInputBitDepth = std::min<uint32_t>((maxLog2TrDynamicRange + 1), (((sizeof(Intermediate_Int) * 8) + rightShift) - scaleBits));
607
44.3k
    const Intermediate_Int inputMaximum        =  (1 << (targetInputBitDepth - 1)) - 1;
608
44.3k
    xDeQuant(uiWidth-1,uiHeight-1,scale,piQCoef,piStride,piCoef,rightShift,inputMaximum,transformMaximum);
609
44.3k
  }
610
44.3k
}
611
612
void Quant::init( int rdoq, bool bUseRDOQTS, int thrVal )
613
17.7k
{
614
615
  // TODO: pass to init() a single variable containing (quantization) flags,
616
  //       instead of variables that don't have to do with this class
617
618
17.7k
  m_RDOQ             = rdoq;
619
17.7k
  m_useRDOQTS        = bUseRDOQTS;
620
17.7k
  m_thrVal           = thrVal;
621
17.7k
}
622
623
/** set flat matrix value to quantized coefficient
624
 */
625
void Quant::setFlatScalingList(const int maxLog2TrDynamicRange[MAX_NUM_CH], const BitDepths &bitDepths )
626
17.7k
{
627
17.7k
  if( !m_scalingListEnabled ) return;
628
629
0
  const int minimumQp = 0;
630
0
  const int maximumQp = SCALING_LIST_REM_NUM;
631
632
0
  for(uint32_t sizeX = 0; sizeX < SCALING_LIST_SIZE_NUM; sizeX++)
633
0
  {
634
0
    for(uint32_t sizeY = 0; sizeY < SCALING_LIST_SIZE_NUM; sizeY++)
635
0
    {
636
0
      for(uint32_t list = 0; list < SCALING_LIST_NUM; list++)
637
0
      {
638
0
        for(int qp = minimumQp; qp < maximumQp; qp++)
639
0
        {
640
0
          xSetFlatScalingList( list, sizeX, sizeY, qp );
641
0
        }
642
0
      }
643
0
    }
644
0
  }
645
0
}
646
647
/** set flat matrix value to quantized coefficient
648
 * \param list List ID
649
 * \param size size index
650
 * \param qp Quantization parameter
651
 * \param format chroma format
652
 */
653
void Quant::xSetFlatScalingList(uint32_t list, uint32_t sizeX, uint32_t sizeY, int qp )
654
0
{
655
0
  uint32_t i,num = g_scalingListSizeX[sizeX]*g_scalingListSizeX[sizeY];
656
0
  int *quantcoeff;
657
0
  int *dequantcoeff;
658
659
0
  const bool blockIsNotPowerOf4 = ((Log2(g_scalingListSizeX[sizeX] * g_scalingListSizeX[sizeY])) & 1) == 1;
660
0
  int quantScales    = g_quantScales   [blockIsNotPowerOf4?1:0][qp];
661
0
  int invQuantScales = g_invQuantScales[blockIsNotPowerOf4?1:0][qp] << 4;
662
663
0
  quantcoeff   = getQuantCoeff(list, qp, sizeX, sizeY);
664
0
  dequantcoeff = getDequantCoeff(list, qp, sizeX, sizeY);
665
666
0
  for(i=0;i<num;i++)
667
0
  {
668
0
    *quantcoeff++ = quantScales;
669
0
    *dequantcoeff++ = invQuantScales;
670
0
  }
671
0
}
672
673
674
/** initialization process of scaling list array
675
 */
676
void Quant::xInitScalingList( const Quant* other, bool useScalingLists )
677
17.7k
{
678
17.7k
  m_isScalingListOwner = other == nullptr;
679
17.7k
  m_scalingListEnabled = useScalingLists;
680
681
142k
  for(uint32_t sizeIdX = 0; sizeIdX < SCALING_LIST_SIZE_NUM; sizeIdX++)
682
124k
  {
683
995k
    for(uint32_t sizeIdY = 0; sizeIdY < SCALING_LIST_SIZE_NUM; sizeIdY++)
684
871k
    {
685
6.09M
      for(uint32_t qp = 0; qp < SCALING_LIST_REM_NUM; qp++)
686
5.22M
      {
687
36.5M
        for(uint32_t listId = 0; listId < SCALING_LIST_NUM; listId++)
688
31.3M
        {
689
31.3M
          if( m_isScalingListOwner )
690
31.3M
          {
691
31.3M
            const size_t scalingListSize = g_scalingListSizeX[sizeIdX] * g_scalingListSizeX[sizeIdY];
692
693
31.3M
            m_quantCoef   [sizeIdX][sizeIdY][listId][qp] = useScalingLists ? new int[scalingListSize] : nullptr;
694
31.3M
            m_dequantCoef [sizeIdX][sizeIdY][listId][qp] = useScalingLists ? new int[scalingListSize] : nullptr;
695
31.3M
          }
696
0
          else
697
0
          {
698
0
            m_quantCoef   [sizeIdX][sizeIdY][listId][qp] = other->m_quantCoef   [sizeIdX][sizeIdY][listId][qp];
699
0
            m_dequantCoef [sizeIdX][sizeIdY][listId][qp] = other->m_dequantCoef [sizeIdX][sizeIdY][listId][qp];
700
0
          }
701
31.3M
        } // listID loop
702
5.22M
      }
703
871k
    }
704
124k
  }
705
17.7k
}
706
707
/** destroy quantization matrix array
708
 */
709
void Quant::xDestroyScalingList()
710
17.7k
{
711
17.7k
  if( !m_isScalingListOwner ) return;
712
713
142k
  for(uint32_t sizeIdX = 0; sizeIdX < SCALING_LIST_SIZE_NUM; sizeIdX++)
714
124k
  {
715
995k
    for(uint32_t sizeIdY = 0; sizeIdY < SCALING_LIST_SIZE_NUM; sizeIdY++)
716
871k
    {
717
6.09M
      for(uint32_t listId = 0; listId < SCALING_LIST_NUM; listId++)
718
5.22M
      {
719
36.5M
        for(uint32_t qp = 0; qp < SCALING_LIST_REM_NUM; qp++)
720
31.3M
        {
721
31.3M
          if(m_quantCoef[sizeIdX][sizeIdY][listId][qp])
722
0
          {
723
0
            delete [] m_quantCoef[sizeIdX][sizeIdY][listId][qp];
724
0
          }
725
31.3M
          if(m_dequantCoef[sizeIdX][sizeIdY][listId][qp])
726
0
          {
727
0
            delete [] m_dequantCoef[sizeIdX][sizeIdY][listId][qp];
728
0
          }
729
31.3M
        }
730
5.22M
      }
731
871k
    }
732
124k
  }
733
17.7k
}
734
735
void Quant::quant(TransformUnit& tu, const ComponentID compID, const CCoeffBuf& pSrc, TCoeff &uiAbsSum, const QpParam& cQP, const Ctx& ctx)
736
5.24k
{
737
5.24k
  const SPS &sps            = *tu.cs->sps;
738
5.24k
  const CompArea& rect      = tu.blocks[compID];
739
5.24k
  const uint32_t uiWidth    = rect.width;
740
5.24k
  const uint32_t uiHeight   = rect.height;
741
5.24k
  const int channelBitDepth = sps.bitDepths[toChannelType(compID)];
742
743
5.24k
  const CCoeffBuf&  piCoef  = pSrc;
744
5.24k
        CoeffSigBuf piQCoef = tu.getCoeffs(compID);
745
746
5.24k
  const bool useTransformSkip = tu.mtsIdx[compID] == MTS_SKIP;
747
5.24k
  const int  maxLog2TrDynamicRange = sps.getMaxLog2TrDynamicRange();
748
749
5.24k
  {
750
5.24k
    CoeffCodingContext cctx(tu, compID, tu.cs->slice->signDataHidingEnabled);
751
752
5.24k
    const TCoeff entropyCodingMinimum = -(1 << maxLog2TrDynamicRange);
753
5.24k
    const TCoeff entropyCodingMaximum =  (1 << maxLog2TrDynamicRange) - 1;
754
755
5.24k
    TCoeff deltaU[MAX_TB_SIZEY * MAX_TB_SIZEY];
756
5.24k
    int scalingListType           = getScalingListType(tu.cu->predMode, compID);
757
5.24k
    CHECK(scalingListType >= SCALING_LIST_NUM, "Invalid scaling list");
758
5.24k
    const uint32_t uiLog2TrWidth  = Log2(uiWidth);
759
5.24k
    const uint32_t uiLog2TrHeight = Log2(uiHeight);
760
5.24k
    int *piQuantCoeff             = getQuantCoeff(scalingListType, cQP.rem(useTransformSkip), uiLog2TrWidth, uiLog2TrHeight);
761
762
5.24k
    const bool isLfnstApplied     = tu.cu->lfnstIdx > 0 && (CU::isSepTree(*tu.cu) ? true : isLuma(compID));
763
5.24k
    const bool enableScalingLists = getUseScalingList(uiWidth, uiHeight, useTransformSkip, isLfnstApplied);
764
765
    // for blocks that where width*height != 4^N, the effective scaling applied during transformation cannot be
766
    // compensated by a bit-shift (the quantised result will be sqrt(2) * larger than required).
767
    // The quantScale table and shift is used to compensate for this.
768
5.24k
    const bool needSqrtAdjustment= TU::needsSqrt2Scale( tu, compID );
769
5.24k
    const int defaultQuantisationCoefficient    = g_quantScales[needSqrtAdjustment?1:0][cQP.rem(useTransformSkip)];
770
5.24k
    const int iTransformShift = getTransformShift(channelBitDepth, rect.size(), maxLog2TrDynamicRange) + ( needSqrtAdjustment?-1:0);
771
772
5.24k
    const int iQBits = QUANT_SHIFT + cQP.per(useTransformSkip) + (useTransformSkip ? 0 : iTransformShift);
773
    // QBits will be OK for any internal bit depth as the reduction in transform shift is balanced by an increase in Qp_per due to QpBDOffset
774
775
5.24k
    const int64_t iAdd = int64_t(tu.cs->slice->isIRAP() ? 171 : 85) << int64_t(iQBits - 9);
776
5.24k
    const int qBits8 = iQBits - 8;
777
778
5.24k
    int lastScanPos = -1;
779
780
5.24k
    if (!enableScalingLists)
781
5.24k
      xQuant(tu,compID,piCoef,piQCoef,uiAbsSum,lastScanPos,deltaU,defaultQuantisationCoefficient,iQBits,iAdd,entropyCodingMinimum,entropyCodingMaximum,cctx.signHiding(),m_thrVal);
782
0
    else
783
0
    {
784
0
      const uint32_t lfnstIdx = tu.cu->lfnstIdx;
785
0
      const int maxNumberOfCoeffs = lfnstIdx > 0 ? ( ( ( uiWidth == 4 && uiHeight == 4 ) || ( uiWidth == 8 && uiHeight == 8 ) ) ? 8 : 16 ) : piQCoef.area();
786
787
0
      piQCoef.memset( 0 );
788
0
      for (int uiScanPos = 0; uiScanPos < maxNumberOfCoeffs; uiScanPos++ )
789
0
      {
790
0
        const int uiBlockPos  = cctx.blockPos( uiScanPos );
791
0
        const TCoeff iLevel   = piCoef.buf[uiBlockPos];
792
0
        const TCoeff iSign    = (iLevel < 0 ? -1: 1);
793
794
0
        const int64_t  tmpLevel = (int64_t)abs(iLevel) * (enableScalingLists ? piQuantCoeff[uiBlockPos] : defaultQuantisationCoefficient);
795
0
        const TCoeff quantisedMagnitude = TCoeff((tmpLevel + iAdd ) >> iQBits);
796
0
        deltaU[uiBlockPos] = (TCoeff)((tmpLevel - ((int64_t)quantisedMagnitude<<iQBits) )>> qBits8);
797
798
0
        uiAbsSum += quantisedMagnitude;
799
0
        const TCoeff quantisedCoefficient = quantisedMagnitude * iSign;
800
801
0
        piQCoef.buf[uiBlockPos] = Clip3<TCoeff>( entropyCodingMinimum, entropyCodingMaximum, quantisedCoefficient );
802
0
      } // for n
803
0
    }
804
5.24k
    if (tu.cu->bdpcmM[toChannelType(compID)])
805
5.24k
    {
806
5.24k
      fwdResDPCM( tu, compID );
807
5.24k
    }
808
809
5.24k
    if( uiAbsSum )
810
3.14k
    {
811
6.28k
      for( int scanPos = lastScanPos; scanPos >= 0; scanPos-- )
812
6.28k
      {
813
6.28k
        unsigned blkPos = cctx.blockPos( scanPos );
814
6.28k
        if( piQCoef.buf[blkPos] )
815
3.14k
        {
816
3.14k
          lastScanPos = scanPos;
817
3.14k
          break;
818
3.14k
        }
819
6.28k
      }
820
821
3.14k
      if( cctx.signHiding() )
822
0
      {
823
0
        if( uiAbsSum >= 2 ) //this prevents TUs with only one coefficient of value 1 from being tested
824
0
        {
825
0
          xSignBitHidingHDQ( piQCoef.buf, piCoef.buf, deltaU, cctx, lastScanPos, maxLog2TrDynamicRange );
826
0
        }
827
0
      }
828
3.14k
    }
829
830
5.24k
    tu.lastPos[compID] = lastScanPos;
831
5.24k
  } //if RDOQ
832
  //return;
833
5.24k
}
834
835
bool Quant::xNeedRDOQ(TransformUnit& tu, const ComponentID compID, const CCoeffBuf& pSrc, const QpParam& cQP)
836
0
{
837
0
  const SPS &sps            = *tu.cs->sps;
838
0
  const CompArea& rect      = tu.blocks[compID];
839
0
  const uint32_t uiWidth    = rect.width;
840
0
  const uint32_t uiHeight   = rect.height;
841
0
  const uint32_t efHeight   = std::min<unsigned>( uiHeight, JVET_C0024_ZERO_OUT_TH );
842
0
  const uint32_t efArea     = uiWidth * efHeight;
843
0
  const int channelBitDepth = sps.bitDepths[toChannelType(compID)];
844
0
  const CCoeffBuf piCoef    = pSrc;
845
846
0
  const bool useTransformSkip      = tu.mtsIdx[compID] == MTS_SKIP;
847
0
  const int  maxLog2TrDynamicRange = sps.getMaxLog2TrDynamicRange();
848
849
0
  const int scalingListType     = getScalingListType( tu.cu->predMode, compID );
850
0
  CHECK( scalingListType >= SCALING_LIST_NUM, "Invalid scaling list" );
851
852
0
  const bool        isDq        = tu.cs->slice->depQuantEnabled && !useTransformSkip;
853
0
  const int         qpDQ        = isDq ? cQP.Qp( false ) + 1 : cQP.Qp( useTransformSkip );
854
0
  const int         qpPer       = isDq ? qpDQ / 6 : cQP.per( useTransformSkip );
855
0
  const int         qpRem       = isDq ? qpDQ - 6 * qpPer : cQP.rem( useTransformSkip );
856
857
0
  const uint32_t uiLog2TrWidth  = Log2( uiWidth );
858
0
  const uint32_t uiLog2TrHeight = Log2( uiHeight );
859
0
  int *piQuantCoeff             = getQuantCoeff( scalingListType, qpRem, uiLog2TrWidth, uiLog2TrHeight );
860
861
0
  const bool isLfnstApplied     = tu.cu->lfnstIdx > 0 && ( CU::isSepTree( *tu.cu ) ? true : isLuma( compID ) );
862
0
  const bool enableScalingLists = getUseScalingList( uiWidth, uiHeight, ( useTransformSkip != 0 ), isLfnstApplied );
863
864
0
  const bool needSqrtAdjustment = TU::needsSqrt2Scale( tu, compID );
865
0
  const int defaultQuantisationCoefficient
866
0
                                = g_quantScales[needSqrtAdjustment?1:0][qpRem];
867
0
  const int iTransformShift     = getTransformShift( channelBitDepth, rect.size(), maxLog2TrDynamicRange ) + ( needSqrtAdjustment ? -1 : 0 );
868
869
870
0
  const int iQBits              = QUANT_SHIFT + qpPer + iTransformShift;
871
872
  // QBits will be OK for any internal bit depth as the reduction in transform shift is balanced by an increase in Qp_per due to QpBDOffset
873
  // iAdd is different from the iAdd used in normal quantization
874
0
  const int64_t iAdd = int64_t( compID == COMP_Y ? 171 : 256 ) << ( iQBits - 9 );
875
876
0
  if( !enableScalingLists )
877
0
    return xNeedRdoq( piCoef.buf, efArea, defaultQuantisationCoefficient, iAdd, iQBits );
878
879
0
  for( int uiBlockPos = 0; uiBlockPos < efArea; uiBlockPos++ )
880
0
  {
881
0
    const TCoeff   iLevel           = piCoef.buf[uiBlockPos];
882
0
    const int64_t  tmpLevel         = ( int64_t ) std::abs( iLevel ) * piQuantCoeff[uiBlockPos];
883
0
    const TCoeff quantisedMagnitude = TCoeff( ( tmpLevel + iAdd ) >> iQBits );
884
885
0
    if( quantisedMagnitude != 0 )
886
0
    {
887
0
      return true;
888
0
    }
889
0
  } // for n
890
0
  return false;
891
0
}
892
893
} // namespace vvenc
894
895
//! \}
896