Coverage Report

Created: 2026-06-10 07:00

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/work/svt-av1/Source/Lib/Codec/entropy_coding.c
Line
Count
Source
1
/*
2
* Copyright(c) 2019 Intel Corporation
3
* Copyright (c) 2016, Alliance for Open Media. All rights reserved
4
*
5
* This source code is subject to the terms of the BSD 2 Clause License and
6
* the Alliance for Open Media Patent License 1.0. If the BSD 2 Clause License
7
* was not distributed with this source code in the LICENSE file, you can
8
* obtain it at https://www.aomedia.org/license/software-license. If the Alliance for Open
9
* Media Patent License 1.0 was not distributed with this source code in the
10
* PATENTS file, you can obtain it at https://www.aomedia.org/license/patent-license.
11
*/
12
13
#include <stdlib.h>
14
#include <string.h>
15
#include <math.h>
16
17
#include "EbSvtAv1.h"
18
#include "entropy_coding.h"
19
#include "utility.h"
20
#include "transforms.h"
21
#include "ec_process.h"
22
#include "common_utils.h"
23
#include "adaptive_mv_pred.h"
24
#include "rd_cost.h"
25
#include "svt_log.h"
26
#include "full_loop.h"
27
#include "aom_dsp_rtcd.h"
28
#include "inter_prediction.h"
29
#include "mode_decision.h"
30
#include "restoration.h"
31
32
4.10k
static void mem_put_varsize(uint8_t* const dst, const int sz, const int val) {
33
4.10k
    switch (sz) {
34
4.10k
    case 1:
35
4.10k
        dst[0] = (uint8_t)(val & 0xff);
36
4.10k
        break;
37
0
    case 2:
38
0
        mem_put_le16(dst, val);
39
0
        break;
40
0
    case 3:
41
0
        mem_put_le24(dst, val);
42
0
        break;
43
0
    case 4:
44
0
        mem_put_le32(dst, val);
45
0
        break;
46
0
    default:
47
0
        assert(0 && "Invalid size");
48
0
        break;
49
4.10k
    }
50
4.10k
}
51
52
int svt_aom_get_comp_index_context_enc(PictureParentControlSet* pcs, int cur_frame_index, int bck_frame_index,
53
0
                                       int fwd_frame_index, const MacroBlockD* xd) {
54
0
    const int fwd = abs(svt_aom_get_relative_dist_enc(&pcs->scs->seq_header, fwd_frame_index, cur_frame_index));
55
0
    const int bck = abs(svt_aom_get_relative_dist_enc(&pcs->scs->seq_header, cur_frame_index, bck_frame_index));
56
57
0
    const MbModeInfo* const above_mi  = xd->above_mbmi;
58
0
    const MbModeInfo* const left_mi   = xd->left_mbmi;
59
0
    const int               offset    = fwd == bck;
60
0
    int                     above_ctx = 0, left_ctx = 0;
61
62
0
    if (above_mi) {
63
0
        if (has_second_ref(&above_mi->block_mi)) {
64
0
            above_ctx = above_mi->block_mi.compound_idx;
65
0
        } else if (above_mi->block_mi.ref_frame[0] == ALTREF_FRAME) {
66
0
            above_ctx = 1;
67
0
        }
68
0
    }
69
70
0
    if (left_mi) {
71
0
        if (has_second_ref(&left_mi->block_mi)) {
72
0
            left_ctx = left_mi->block_mi.compound_idx;
73
0
        } else if (left_mi->block_mi.ref_frame[0] == ALTREF_FRAME) {
74
0
            left_ctx = 1;
75
0
        }
76
0
    }
77
0
    return above_ctx + left_ctx + 3 * offset;
78
0
}
79
80
0
int svt_aom_get_comp_group_idx_context_enc(const MacroBlockD* xd) {
81
0
    const MbModeInfo* const above_mi  = xd->above_mbmi;
82
0
    const MbModeInfo* const left_mi   = xd->left_mbmi;
83
0
    int                     above_ctx = 0, left_ctx = 0;
84
0
    if (above_mi) {
85
0
        if (has_second_ref(&above_mi->block_mi)) {
86
0
            above_ctx = above_mi->block_mi.comp_group_idx;
87
0
        } else if (above_mi->block_mi.ref_frame[0] == ALTREF_FRAME) {
88
0
            above_ctx = 3;
89
0
        }
90
0
    }
91
0
    if (left_mi) {
92
0
        if (has_second_ref(&left_mi->block_mi)) {
93
0
            left_ctx = left_mi->block_mi.comp_group_idx;
94
0
        } else if (left_mi->block_mi.ref_frame[0] == ALTREF_FRAME) {
95
0
            left_ctx = 3;
96
0
        }
97
0
    }
98
0
    return AOMMIN(5, above_ctx + left_ctx);
99
0
}
100
101
static INLINE int32_t does_level_match(int32_t width, int32_t height, double fps, int32_t lvl_width, int32_t lvl_height,
102
860
                                       double lvl_fps, int32_t lvl_dim_mult) {
103
860
    const int64_t lvl_luma_pels           = (int64_t)lvl_width * lvl_height;
104
860
    const double  lvl_display_sample_rate = lvl_luma_pels * lvl_fps;
105
860
    const int64_t luma_pels               = (int64_t)width * height;
106
860
    const double  display_sample_rate     = luma_pels * fps;
107
860
    return luma_pels <= lvl_luma_pels && display_sample_rate <= lvl_display_sample_rate &&
108
860
        width <= lvl_width * lvl_dim_mult && height <= lvl_height * lvl_dim_mult;
109
860
}
110
111
860
static void set_bitstream_level_tier(SequenceControlSet* scs) {
112
    // This is a placeholder function that only addresses dimensions
113
    // and max display sample rates.
114
    // Need to add checks for max bit rate, max decoded luma sample rate, header
115
    // rate, etc. that are not covered by this function.
116
117
860
    BitstreamLevel bl = {9, 3};
118
860
    if (scs->static_config.level) {
119
0
        bl.major = scs->static_config.level / 10;
120
0
        bl.minor = scs->static_config.level % 10;
121
860
    } else if (does_level_match(scs->seq_header.max_frame_width,
122
860
                                scs->seq_header.max_frame_height,
123
860
                                scs->frame_rate,
124
860
                                512,
125
860
                                288,
126
860
                                30.0,
127
860
                                4)) {
128
860
        bl.major = 2;
129
860
        bl.minor = 0;
130
860
    } else if (does_level_match(scs->seq_header.max_frame_width,
131
0
                                scs->seq_header.max_frame_height,
132
0
                                scs->frame_rate,
133
0
                                704,
134
0
                                396,
135
0
                                30.0,
136
0
                                4)) {
137
0
        bl.major = 2;
138
0
        bl.minor = 1;
139
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
140
0
                                scs->seq_header.max_frame_height,
141
0
                                scs->frame_rate,
142
0
                                1088,
143
0
                                612,
144
0
                                30.0,
145
0
                                4)) {
146
0
        bl.major = 3;
147
0
        bl.minor = 0;
148
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
149
0
                                scs->seq_header.max_frame_height,
150
0
                                scs->frame_rate,
151
0
                                1376,
152
0
                                774,
153
0
                                30.0,
154
0
                                4)) {
155
0
        bl.major = 3;
156
0
        bl.minor = 1;
157
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
158
0
                                scs->seq_header.max_frame_height,
159
0
                                scs->frame_rate,
160
0
                                2048,
161
0
                                1152,
162
0
                                30.0,
163
0
                                3)) {
164
0
        bl.major = 4;
165
0
        bl.minor = 0;
166
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
167
0
                                scs->seq_header.max_frame_height,
168
0
                                scs->frame_rate,
169
0
                                2048,
170
0
                                1152,
171
0
                                60.0,
172
0
                                3)) {
173
0
        bl.major = 4;
174
0
        bl.minor = 1;
175
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
176
0
                                scs->seq_header.max_frame_height,
177
0
                                scs->frame_rate,
178
0
                                4096,
179
0
                                2176,
180
0
                                30.0,
181
0
                                2)) {
182
0
        bl.major = 5;
183
0
        bl.minor = 0;
184
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
185
0
                                scs->seq_header.max_frame_height,
186
0
                                scs->frame_rate,
187
0
                                4096,
188
0
                                2176,
189
0
                                60.0,
190
0
                                2)) {
191
0
        bl.major = 5;
192
0
        bl.minor = 1;
193
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
194
0
                                scs->seq_header.max_frame_height,
195
0
                                scs->frame_rate,
196
0
                                4096,
197
0
                                2176,
198
0
                                120.0,
199
0
                                2)) {
200
0
        bl.major = 5;
201
0
        bl.minor = 2;
202
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
203
0
                                scs->seq_header.max_frame_height,
204
0
                                scs->frame_rate,
205
0
                                8192,
206
0
                                4352,
207
0
                                30.0,
208
0
                                2)) {
209
0
        bl.major = 6;
210
0
        bl.minor = 0;
211
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
212
0
                                scs->seq_header.max_frame_height,
213
0
                                scs->frame_rate,
214
0
                                8192,
215
0
                                4352,
216
0
                                60.0,
217
0
                                2)) {
218
0
        bl.major = 6;
219
0
        bl.minor = 1;
220
0
    } else if (does_level_match(scs->seq_header.max_frame_width,
221
0
                                scs->seq_header.max_frame_height,
222
0
                                scs->frame_rate,
223
0
                                8192,
224
0
                                4352,
225
0
                                120.0,
226
0
                                2)) {
227
0
        bl.major = 6;
228
0
        bl.minor = 2;
229
0
    }
230
28.3k
    for (int32_t i = 0; i < MAX_NUM_OPERATING_POINTS; ++i) {
231
27.5k
        scs->level[i]                               = bl;
232
27.5k
        scs->seq_header.operating_point[i].seq_tier = 0; // setting main tier by default
233
27.5k
    }
234
860
}
235
236
12.7k
static INLINE void write_golomb(AomWriter* w, int32_t level) {
237
12.7k
    const int32_t  x      = level + 1;
238
12.7k
    const uint32_t length = svt_log2f(x) + 1;
239
12.7k
    assert(length > 0);
240
241
12.7k
    aom_write_literal(w, 0, length - 1);
242
12.7k
    aom_write_literal(w, x, length);
243
12.7k
}
244
245
/************************************************************************************************/
246
// blockd.h
247
248
void svt_aom_get_txb_ctx(PictureControlSet* pcs, const int32_t plane,
249
                         NeighborArrayUnit* dc_sign_level_coeff_neighbor_array, uint32_t blk_org_x, uint32_t blk_org_y,
250
                         const BlockSize plane_bsize, const TxSize tx_size, int16_t* const txb_skip_ctx,
251
22.1k
                         int16_t* const dc_sign_ctx) {
252
    /* Hoist NA ring pointers and iterate them directly. Shape-B PU NA. */
253
22.1k
    const uint8_t* const top_ptr  = svt_aom_na_top_ptr_pu(dc_sign_level_coeff_neighbor_array, blk_org_x);
254
22.1k
    const uint8_t* const left_ptr = svt_aom_na_left_ptr_pu(dc_sign_level_coeff_neighbor_array, blk_org_y);
255
256
22.1k
    static const int8_t signs[3]    = {0, -1, 1};
257
22.1k
    const int32_t       plane_shift = !!plane;
258
22.1k
    int32_t             txb_w_unit  = MIN(eb_tx_size_wide_unit[tx_size],
259
22.1k
                             (int32_t)((pcs->ppcs->aligned_width >> plane_shift) - blk_org_x) >> 2);
260
22.1k
    int32_t             txb_h_unit  = MIN(eb_tx_size_high_unit[tx_size],
261
22.1k
                             (int32_t)((pcs->ppcs->aligned_height >> plane_shift) - blk_org_y) >> 2);
262
263
22.1k
    int16_t dc_sign = 0;
264
22.1k
    int32_t top     = 0; /* OR-accumulation across neighbors */
265
22.1k
    int32_t left    = 0;
266
267
    /* Combined top sweep: dc_sign + OR-accumulated top. */
268
22.1k
    if (top_ptr[0] != INVALID_NEIGHBOR_DATA) {
269
14.1k
        for (int32_t k = 0; k < txb_w_unit; ++k) {
270
9.22k
            uint8_t v    = top_ptr[k];
271
9.22k
            uint8_t sign = v >> COEFF_CONTEXT_BITS;
272
9.22k
            assert(sign <= 2);
273
9.22k
            dc_sign += signs[sign];
274
9.22k
            top |= v;
275
9.22k
        }
276
4.88k
    }
277
    /* Combined left sweep: dc_sign + OR-accumulated left. */
278
22.1k
    if (left_ptr[0] != INVALID_NEIGHBOR_DATA) {
279
23.8k
        for (int32_t k = 0; k < txb_h_unit; ++k) {
280
18.2k
            uint8_t v    = left_ptr[k];
281
18.2k
            uint8_t sign = v >> COEFF_CONTEXT_BITS;
282
18.2k
            assert(sign <= 2);
283
18.2k
            dc_sign += signs[sign];
284
18.2k
            left |= v;
285
18.2k
        }
286
5.65k
    }
287
288
22.1k
    if (dc_sign > 0) {
289
0
        *dc_sign_ctx = 2;
290
22.1k
    } else if (dc_sign < 0) {
291
6.57k
        *dc_sign_ctx = 1;
292
15.5k
    } else {
293
15.5k
        *dc_sign_ctx = 0;
294
15.5k
    }
295
296
22.1k
    int32_t tx_bsize = txsize_to_bsize[tx_size];
297
22.1k
    if (plane == 0) {
298
11.3k
        if (plane_bsize == tx_bsize) {
299
3.43k
            *txb_skip_ctx = 0;
300
7.91k
        } else {
301
7.91k
            static const uint8_t skip_contexts[5][5] = {
302
7.91k
                {1, 2, 2, 2, 3}, {1, 4, 4, 4, 5}, {1, 4, 4, 4, 5}, {1, 4, 4, 4, 5}, {1, 4, 4, 4, 6}};
303
7.91k
            top &= COEFF_CONTEXT_MASK;
304
7.91k
            left &= COEFF_CONTEXT_MASK;
305
7.91k
            int32_t max = AOMMIN(top | left, 4);
306
7.91k
            int32_t min = AOMMIN(AOMMIN(top, left), 4);
307
308
7.91k
            *txb_skip_ctx = skip_contexts[min][max];
309
7.91k
        }
310
11.3k
    } else {
311
10.8k
        int32_t ctx_base   = ((left != 0) + (top != 0));
312
10.8k
        int32_t ctx_offset = (eb_num_pels_log2_lookup[plane_bsize] > eb_num_pels_log2_lookup[tx_bsize]) ? 10 : 7;
313
10.8k
        *txb_skip_ctx      = (int16_t)(ctx_base + ctx_offset);
314
10.8k
    }
315
22.1k
}
316
317
static void av1_write_tx_type(PictureParentControlSet* pcs, FRAME_CONTEXT* frame_context, MbModeInfo* mbmi,
318
5.15k
                              AomWriter* ec_writer, uint32_t intraDir, TxType tx_type, TxSize tx_size) {
319
5.15k
    FrameHeader*  frm_hdr  = &pcs->frm_hdr;
320
5.15k
    const int32_t is_inter = mbmi->block_mi.use_intrabc || is_inter_mode(mbmi->block_mi.mode);
321
5.15k
    if (get_ext_tx_types(tx_size, is_inter, frm_hdr->reduced_tx_set) > 1 &&
322
2.70k
        (frm_hdr->quantization_params.base_q_idx > 0)) {
323
726
        const TxSize square_tx_size = txsize_sqr_map[tx_size];
324
726
        assert(square_tx_size <= EXT_TX_SIZES);
325
326
726
        const TxSetType tx_set_type = get_ext_tx_set_type(tx_size, is_inter, frm_hdr->reduced_tx_set);
327
726
        const int32_t   eset        = get_ext_tx_set(tx_size, is_inter, frm_hdr->reduced_tx_set);
328
        // eset == 0 should correspond to a set with only DCT_DCT and there
329
        // is no need to send the tx_type
330
726
        assert(eset > 0);
331
726
        assert(av1_ext_tx_used[tx_set_type][tx_type]);
332
726
        if (is_inter) {
333
0
            aom_write_symbol(ec_writer,
334
0
                             av1_ext_tx_ind[tx_set_type][tx_type],
335
0
                             frame_context->inter_ext_tx_cdf[eset][square_tx_size],
336
0
                             av1_num_ext_tx_set[tx_set_type]);
337
726
        } else {
338
726
            PredictionMode intra_dir;
339
726
            if (mbmi->block_mi.filter_intra_mode != FILTER_INTRA_MODES) {
340
0
                intra_dir = fimode_to_intradir[mbmi->block_mi.filter_intra_mode];
341
726
            } else {
342
726
                intra_dir = intraDir;
343
726
            }
344
345
726
            assert(intra_dir < 13);
346
726
            assert(square_tx_size < 4);
347
726
            aom_write_symbol(ec_writer,
348
726
                             av1_ext_tx_ind[tx_set_type][tx_type],
349
726
                             frame_context->intra_ext_tx_cdf[eset][square_tx_size][intra_dir],
350
726
                             av1_num_ext_tx_set[tx_set_type]);
351
726
        }
352
726
    }
353
5.15k
}
354
355
static int32_t av1_write_coeffs_txb_1d(PictureParentControlSet* ppcs, FRAME_CONTEXT* frame_context, MbModeInfo* mbmi,
356
                                       AomWriter* ec_writer, EcBlkStruct* blk_ptr, TxSize tx_size, uint32_t txb_index,
357
                                       uint32_t intraLumaDir, int32_t* coeff_buffer_ptr, COMPONENT_TYPE component_type,
358
                                       int16_t txb_skip_ctx, int16_t dc_sign_ctx, int16_t eob,
359
22.1k
                                       EntropyCodingContext* ec_ctx) {
360
22.1k
    int32_t      c;
361
22.1k
    const TxSize txs_ctx = get_txsize_entropy_ctx(tx_size);
362
22.1k
    TxType       tx_type = component_type == COMPONENT_LUMA ? blk_ptr->tx_type[txb_index] : blk_ptr->tx_type_uv;
363
364
22.1k
    assert(txs_ctx < TX_SIZES);
365
366
22.1k
    aom_write_symbol(ec_writer, eob == 0, frame_context->txb_skip_cdf[txs_ctx][txb_skip_ctx], 2);
367
368
22.1k
    assert(IMPLIES((component_type == 0 && eob == 0), tx_type == DCT_DCT));
369
22.1k
    assert(IMPLIES((is_inter_mode(mbmi->block_mi.mode) && component_type == 0 && eob == 0 && txb_index == 0),
370
22.1k
                   blk_ptr->tx_type_uv == DCT_DCT));
371
22.1k
    if (eob == 0) {
372
7.02k
        return 0;
373
7.02k
    }
374
15.1k
    if (component_type == COMPONENT_LUMA) {
375
5.15k
        av1_write_tx_type(ppcs, frame_context, mbmi, ec_writer, intraLumaDir, tx_type, tx_size);
376
5.15k
    }
377
15.1k
    int         eob_extra;
378
15.1k
    const int   eob_pt         = get_eob_pos_token(eob, &eob_extra);
379
15.1k
    const int   eob_multi_size = txsize_log2_minus4[tx_size];
380
15.1k
    const int   eob_multi_ctx  = (tx_type_to_class[tx_type] == TX_CLASS_2D) ? 0 : 1;
381
15.1k
    AomCdfProb* eob_flag_cdfs;
382
15.1k
    switch (eob_multi_size) {
383
6.72k
    case 0:
384
6.72k
        eob_flag_cdfs = frame_context->eob_flag_cdf16[component_type][eob_multi_ctx];
385
6.72k
        break;
386
0
    case 1:
387
0
        eob_flag_cdfs = frame_context->eob_flag_cdf32[component_type][eob_multi_ctx];
388
0
        break;
389
935
    case 2:
390
935
        eob_flag_cdfs = frame_context->eob_flag_cdf64[component_type][eob_multi_ctx];
391
935
        break;
392
0
    case 3:
393
0
        eob_flag_cdfs = frame_context->eob_flag_cdf128[component_type][eob_multi_ctx];
394
0
        break;
395
1.03k
    case 4:
396
1.03k
        eob_flag_cdfs = frame_context->eob_flag_cdf256[component_type][eob_multi_ctx];
397
1.03k
        break;
398
0
    case 5:
399
0
        eob_flag_cdfs = frame_context->eob_flag_cdf512[component_type][eob_multi_ctx];
400
0
        break;
401
6.42k
    case 6:
402
6.42k
    default:
403
6.42k
        eob_flag_cdfs = frame_context->eob_flag_cdf1024[component_type][eob_multi_ctx];
404
6.42k
        break;
405
15.1k
    }
406
15.1k
    aom_write_symbol(ec_writer, eob_pt - 1, eob_flag_cdfs, eob_multi_size + 5);
407
15.1k
    if (eob_pt > 2) {
408
0
        int cnt = eob_pt - 3;
409
0
        int bit = (eob_extra >> cnt) & 1;
410
0
        aom_write_symbol(ec_writer, bit, frame_context->eob_extra_cdf[txs_ctx][component_type][cnt], 2);
411
0
        aom_write_literal(ec_writer, eob_extra, cnt);
412
0
    }
413
414
15.1k
#if OPT_EC_DC_ONLY
415
    // Fast path for eob==1: single DC coefficient.
416
    // Contexts are known: coeff_ctx=0 (get_lower_levels_ctx_eob returns 0 for scan_idx=0),
417
    // br_ctx=0 (DC position with all-zero neighbors).
418
    // Skips txb_init_levels and get_nz_map_contexts entirely.
419
15.1k
    if (eob == 1) {
420
15.1k
        const int32_t v         = coeff_buffer_ptr[0];
421
15.1k
        int32_t       level     = ABS(v);
422
15.1k
        AomCdfProb*   dc_br_cdf = frame_context->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][component_type][0];
423
424
15.1k
        aom_write_symbol(
425
15.1k
            ec_writer, AOMMIN(level, 3) - 1, frame_context->coeff_base_eob_cdf[txs_ctx][component_type][0], 3);
426
15.1k
        if (level > NUM_BASE_LEVELS) {
427
13.6k
            int32_t base_range = level - 1 - NUM_BASE_LEVELS;
428
65.9k
            for (int32_t idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) {
429
53.1k
                const int32_t k = AOMMIN(base_range - idx, BR_CDF_SIZE - 1);
430
53.1k
                aom_write_symbol(ec_writer, k, dc_br_cdf, BR_CDF_SIZE);
431
53.1k
                if (k < BR_CDF_SIZE - 1) {
432
828
                    break;
433
828
                }
434
53.1k
            }
435
13.6k
        }
436
        // Sign (DC always uses dc_sign_cdf)
437
15.1k
        aom_write_symbol(ec_writer, (v < 0) ? 1 : 0, frame_context->dc_sign_cdf[component_type][dc_sign_ctx], 2);
438
15.1k
        if (level > COEFF_BASE_RANGE + NUM_BASE_LEVELS) {
439
12.7k
            write_golomb(ec_writer, level - COEFF_BASE_RANGE - 1 - NUM_BASE_LEVELS);
440
12.7k
        }
441
442
15.1k
        int32_t cul_level = AOMMIN(level, COEFF_CONTEXT_MASK);
443
15.1k
        set_dc_sign(&cul_level, coeff_buffer_ptr[0]);
444
15.1k
        return cul_level;
445
15.1k
    }
446
0
#endif
447
448
0
    const int bwl    = get_txb_bwl(tx_size);
449
0
    const int width  = get_txb_wide(tx_size);
450
0
    const int height = get_txb_high(tx_size);
451
452
0
    uint8_t* const levels = set_levels(ec_ctx->levels_buf, width, height);
453
0
    svt_av1_txb_init_levels(coeff_buffer_ptr, width, height, levels);
454
455
0
    const ScanOrder* const scan_order = get_scan_order(tx_size, tx_type);
456
0
    const int16_t* const   scan       = scan_order->scan;
457
458
0
    svt_av1_get_nz_map_contexts(levels, scan, eob, tx_size, tx_type_to_class[tx_type], ec_ctx->coeff_contexts);
459
460
0
#if OPT_EC_MERGE_COEFF_LOOPS
461
    // Merged approach: backward pass caches level/sign per coefficient,
462
    // accumulates cul_level, then a forward pass emits signs from cache.
463
    // Avoids re-reading coeff_buffer_ptr[scan[c]] in the forward pass.
464
0
    const TxClass tx_class   = tx_type_to_class[tx_type];
465
0
    const int32_t br_txs_ctx = AOMMIN(txs_ctx, TX_32X32);
466
467
    // Pre-compute CDF base pointers (loop-invariant outer dimensions)
468
0
    AomCdfProb(*base_cdf)[CDF_SIZE(4)]         = frame_context->coeff_base_cdf[txs_ctx][component_type];
469
0
    AomCdfProb(*br_cdf)[CDF_SIZE(BR_CDF_SIZE)] = frame_context->coeff_br_cdf[br_txs_ctx][component_type];
470
471
    // Cache: store level and sign for each scan position 0..eob-1
472
    // VLA sized to eob (guaranteed >= 2 here) instead of MAX_TX_SQUARE (4096)
473
    // to reduce stack usage from ~12KB to a few bytes for typical small blocks.
474
    // MSVC does not support C99 VLAs, so fall back to MAX_TX_SQUARE there.
475
#ifdef _MSC_VER
476
    int16_t cached_level[MAX_TX_SQUARE];
477
    uint8_t cached_sign[MAX_TX_SQUARE];
478
#else
479
0
    int16_t cached_level[eob];
480
0
    uint8_t cached_sign[eob];
481
0
#endif
482
0
    int32_t cul_level = 0;
483
484
    // Backward pass: base levels + base_range + cache
485
0
    {
486
0
        AomCdfProb(*base_eob_cdf)[CDF_SIZE(3)] = frame_context->coeff_base_eob_cdf[txs_ctx][component_type];
487
488
        // Peeled first iteration: c == eob - 1
489
0
        const int16_t pos       = scan[eob - 1];
490
0
        const int32_t v         = coeff_buffer_ptr[pos];
491
0
        const int16_t coeff_ctx = ec_ctx->coeff_contexts[pos];
492
0
        int32_t       level     = ABS(v);
493
494
0
        cached_level[eob - 1] = (int16_t)level;
495
0
        cached_sign[eob - 1]  = (v < 0) ? 1 : 0;
496
0
        cul_level += level;
497
498
0
        aom_write_symbol(ec_writer, AOMMIN(level, 3) - 1, base_eob_cdf[coeff_ctx], 3);
499
0
        if (level > NUM_BASE_LEVELS) {
500
0
            int32_t base_range = level - 1 - NUM_BASE_LEVELS;
501
0
            int16_t br_ctx     = get_br_ctx(levels, pos, bwl, tx_class);
502
0
            for (int32_t idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) {
503
0
                const int32_t k = AOMMIN(base_range - idx, BR_CDF_SIZE - 1);
504
0
                aom_write_symbol(ec_writer, k, br_cdf[br_ctx], BR_CDF_SIZE);
505
0
                if (k < BR_CDF_SIZE - 1) {
506
0
                    break;
507
0
                }
508
0
            }
509
0
        }
510
0
    }
511
0
    for (c = eob - 2; c >= 0; --c) {
512
0
        const int16_t pos       = scan[c];
513
0
        const int32_t v         = coeff_buffer_ptr[pos];
514
0
        const int16_t coeff_ctx = ec_ctx->coeff_contexts[pos];
515
0
        int32_t       level     = ABS(v);
516
517
0
        cached_level[c] = (int16_t)level;
518
0
        cached_sign[c]  = (v < 0) ? 1 : 0;
519
0
        cul_level += level;
520
521
0
        aom_write_symbol(ec_writer, AOMMIN(level, 3), base_cdf[coeff_ctx], 4);
522
0
        if (level > NUM_BASE_LEVELS) {
523
0
            int32_t base_range = level - 1 - NUM_BASE_LEVELS;
524
0
            int16_t br_ctx     = get_br_ctx(levels, pos, bwl, tx_class);
525
0
            for (int32_t idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) {
526
0
                const int32_t k = AOMMIN(base_range - idx, BR_CDF_SIZE - 1);
527
0
                aom_write_symbol(ec_writer, k, br_cdf[br_ctx], BR_CDF_SIZE);
528
0
                if (k < BR_CDF_SIZE - 1) {
529
0
                    break;
530
0
                }
531
0
            }
532
0
        }
533
0
    }
534
535
    // Forward pass: signs + golomb from cached data (no coeff_buffer_ptr re-read)
536
0
    for (c = 0; c < eob; ++c) {
537
0
        const int32_t level = cached_level[c];
538
0
        if (level) {
539
0
            if (c == 0) {
540
0
                aom_write_symbol(ec_writer, cached_sign[c], frame_context->dc_sign_cdf[component_type][dc_sign_ctx], 2);
541
0
            } else {
542
0
                aom_write_bit(ec_writer, cached_sign[c]);
543
0
            }
544
0
            if (level > COEFF_BASE_RANGE + NUM_BASE_LEVELS) {
545
0
                write_golomb(ec_writer, level - COEFF_BASE_RANGE - 1 - NUM_BASE_LEVELS);
546
0
            }
547
0
        }
548
0
    }
549
550
0
    cul_level = AOMMIN(COEFF_CONTEXT_MASK, cul_level);
551
0
    set_dc_sign(&cul_level, coeff_buffer_ptr[0]);
552
0
    return cul_level;
553
#else
554
    // Pre-compute CDF base pointers (loop-invariant outer dimensions)
555
    AomCdfProb(*base_cdf)[CDF_SIZE(4)]         = frame_context->coeff_base_cdf[txs_ctx][component_type];
556
    AomCdfProb(*base_eob_cdf)[CDF_SIZE(3)]     = frame_context->coeff_base_eob_cdf[txs_ctx][component_type];
557
    AomCdfProb(*br_cdf)[CDF_SIZE(BR_CDF_SIZE)] = frame_context->coeff_br_cdf[AOMMIN(txs_ctx, TX_32X32)][component_type];
558
    for (c = eob - 1; c >= 0; --c) {
559
        const int16_t pos       = scan[c];
560
        const int32_t v         = coeff_buffer_ptr[pos];
561
        const int16_t coeff_ctx = ec_ctx->coeff_contexts[pos];
562
        int32_t       level     = ABS(v);
563
564
        if (c == eob - 1) {
565
            aom_write_symbol(ec_writer, AOMMIN(level, 3) - 1, base_eob_cdf[coeff_ctx], 3);
566
        } else {
567
            aom_write_symbol(ec_writer, AOMMIN(level, 3), base_cdf[coeff_ctx], 4);
568
        }
569
        if (level > NUM_BASE_LEVELS) {
570
            // level is above 1.
571
            int32_t base_range = level - 1 - NUM_BASE_LEVELS;
572
            int16_t br_ctx     = get_br_ctx(levels, pos, bwl, tx_type_to_class[tx_type]);
573
            for (int32_t idx = 0; idx < COEFF_BASE_RANGE; idx += BR_CDF_SIZE - 1) {
574
                const int32_t k = AOMMIN(base_range - idx, BR_CDF_SIZE - 1);
575
                aom_write_symbol(ec_writer, k, br_cdf[br_ctx], BR_CDF_SIZE);
576
                if (k < BR_CDF_SIZE - 1) {
577
                    break;
578
                }
579
            }
580
        }
581
    }
582
    // Loop to code all signs in the transform block,
583
    // starting with the sign of DC (if applicable)
584
585
    int32_t cul_level = 0;
586
    for (c = 0; c < eob; ++c) {
587
        const int16_t pos   = scan[c];
588
        const int32_t v     = coeff_buffer_ptr[pos];
589
        int32_t       level = ABS(v);
590
        cul_level += level;
591
592
        const int32_t sign = (v < 0) ? 1 : 0;
593
        if (level) {
594
            if (c == 0) {
595
                aom_write_symbol(ec_writer, sign, frame_context->dc_sign_cdf[component_type][dc_sign_ctx], 2);
596
            } else {
597
                aom_write_bit(ec_writer, sign);
598
            }
599
            if (level > COEFF_BASE_RANGE + NUM_BASE_LEVELS) {
600
                write_golomb(ec_writer, level - COEFF_BASE_RANGE - 1 - NUM_BASE_LEVELS);
601
            }
602
        }
603
    }
604
605
    cul_level = AOMMIN(COEFF_CONTEXT_MASK, cul_level);
606
    // DC value
607
    set_dc_sign(&cul_level, coeff_buffer_ptr[0]);
608
    return cul_level;
609
#endif
610
15.1k
}
611
612
static EbErrorType av1_encode_tx_coef_y(PictureControlSet* pcs, EntropyCodingContext* ec_ctx,
613
                                        FRAME_CONTEXT* frame_context, AomWriter* ec_writer, MbModeInfo* mbmi,
614
                                        EcBlkStruct* blk_ptr, uint32_t blk_org_x, uint32_t blk_org_y,
615
                                        uint32_t intraLumaDir, BlockSize plane_bsize, EbPictureBufferDesc* coeff_ptr,
616
1.97k
                                        NeighborArrayUnit* luma_dc_sign_level_coeff_na) {
617
1.97k
    EbErrorType     return_error = EB_ErrorNone;
618
1.97k
    const bool      is_inter     = is_inter_mode(mbmi->block_mi.mode) || mbmi->block_mi.use_intrabc;
619
1.97k
    const BlockSize bsize        = mbmi->bsize;
620
1.97k
    const uint8_t   tx_depth     = mbmi->block_mi.tx_depth;
621
1.97k
    const uint16_t  txb_count    = tx_blocks_per_depth[bsize][tx_depth];
622
1.97k
    const TxSize    tx_size      = tx_depth_to_tx_size[tx_depth][bsize];
623
1.97k
    const int       tx_width     = tx_size_wide[tx_size];
624
1.97k
    const int       tx_height    = tx_size_high[tx_size];
625
626
9.89k
    for (uint16_t txb_itr = 0; txb_itr < txb_count; txb_itr++) {
627
        // Hoist tx_org lookup: same Position is used by both svt_aom_get_txb_ctx and the NA write.
628
7.91k
        const Position org  = tx_org[bsize][is_inter][tx_depth][txb_itr];
629
7.91k
        const uint32_t tx_x = blk_org_x + org.x;
630
7.91k
        const uint32_t tx_y = blk_org_y + org.y;
631
632
7.91k
        int32_t* coeff_buffer = (int32_t*)coeff_ptr->y_buffer + ec_ctx->coded_area_sb;
633
634
7.91k
        int16_t txb_skip_ctx = 0;
635
7.91k
        int16_t dc_sign_ctx  = 0;
636
7.91k
        svt_aom_get_txb_ctx(pcs,
637
7.91k
                            COMPONENT_LUMA,
638
7.91k
                            luma_dc_sign_level_coeff_na,
639
7.91k
                            tx_x,
640
7.91k
                            tx_y,
641
7.91k
                            plane_bsize,
642
7.91k
                            tx_size,
643
7.91k
                            &txb_skip_ctx,
644
7.91k
                            &dc_sign_ctx);
645
646
7.91k
        int32_t cul_level_y = av1_write_coeffs_txb_1d(pcs->ppcs,
647
7.91k
                                                      frame_context,
648
7.91k
                                                      mbmi,
649
7.91k
                                                      ec_writer,
650
7.91k
                                                      blk_ptr,
651
7.91k
                                                      tx_size,
652
7.91k
                                                      txb_itr,
653
7.91k
                                                      intraLumaDir,
654
7.91k
                                                      coeff_buffer,
655
7.91k
                                                      COMPONENT_LUMA,
656
7.91k
                                                      txb_skip_ctx,
657
7.91k
                                                      dc_sign_ctx,
658
7.91k
                                                      blk_ptr->eob.y[txb_itr],
659
7.91k
                                                      ec_ctx);
660
661
        // Update the luma Dc Sign Level Coeff Neighbor Array
662
7.91k
        uint8_t dc_sign_level_coeff = (uint8_t)cul_level_y;
663
7.91k
        svt_aom_neighbor_array_unit_mode_write_pu(luma_dc_sign_level_coeff_na,
664
7.91k
                                                  &dc_sign_level_coeff,
665
7.91k
                                                  tx_x,
666
7.91k
                                                  tx_y,
667
7.91k
                                                  tx_width,
668
7.91k
                                                  tx_height,
669
7.91k
                                                  NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
670
671
7.91k
        ec_ctx->coded_area_sb += tx_width * tx_height;
672
7.91k
    }
673
674
1.97k
    return return_error;
675
1.97k
}
676
677
static void av1_encode_tx_coef_uv(PictureControlSet* pcs, EntropyCodingContext* ec_ctx, FRAME_CONTEXT* frame_context,
678
                                  AomWriter* ec_writer, EcBlkStruct* blk_ptr, uint32_t blk_org_x, uint32_t blk_org_y,
679
                                  uint32_t intraLumaDir, EbPictureBufferDesc* coeff_ptr,
680
                                  NeighborArrayUnit* cr_dc_sign_level_coeff_na,
681
1.97k
                                  NeighborArrayUnit* cb_dc_sign_level_coeff_na) {
682
1.97k
    MbModeInfo* const mbmi   = ec_ctx->mbmi;
683
1.97k
    const BlockSize   bsize  = mbmi->bsize;
684
1.97k
    const bool        has_uv = is_chroma_reference(blk_org_y >> 2, blk_org_x >> 2, bsize, 1, 1);
685
686
1.97k
    if (!has_uv) {
687
0
        return;
688
0
    }
689
1.97k
    const int32_t   is_inter       = is_inter_mode(mbmi->block_mi.mode) || mbmi->block_mi.use_intrabc;
690
1.97k
    const BlockSize bsize_uv       = get_plane_block_size(bsize, 1, 1);
691
1.97k
    const uint8_t   tx_depth       = mbmi->block_mi.tx_depth;
692
1.97k
    const TxSize    chroma_tx_size = av1_get_max_uv_txsize(bsize, 1, 1);
693
1.97k
    const int       tx_width_uv    = tx_size_wide[chroma_tx_size];
694
1.97k
    const int       tx_height_uv   = tx_size_high[chroma_tx_size];
695
1.97k
    const unsigned  txb_count      = 1;
696
697
3.95k
    for (unsigned tx_index = 0; tx_index < txb_count; ++tx_index) {
698
        // Hoist tx_org lookup + ROUND_UV: reused by 4 sites below.
699
1.97k
        const Position org  = tx_org[bsize][is_inter][tx_depth][tx_index];
700
1.97k
        const uint32_t uv_x = ROUND_UV(blk_org_x + org.x) >> 1;
701
1.97k
        const uint32_t uv_y = ROUND_UV(blk_org_y + org.y) >> 1;
702
703
        // cb
704
1.97k
        int32_t* coeff_buffer = (int32_t*)coeff_ptr->u_buffer + ec_ctx->coded_area_sb_uv;
705
1.97k
        int16_t  txb_skip_ctx = 0;
706
1.97k
        int16_t  dc_sign_ctx  = 0;
707
708
1.97k
        svt_aom_get_txb_ctx(pcs,
709
1.97k
                            COMPONENT_CHROMA,
710
1.97k
                            cb_dc_sign_level_coeff_na,
711
1.97k
                            uv_x,
712
1.97k
                            uv_y,
713
1.97k
                            bsize_uv,
714
1.97k
                            chroma_tx_size,
715
1.97k
                            &txb_skip_ctx,
716
1.97k
                            &dc_sign_ctx);
717
718
1.97k
        int32_t cul_level_cb = av1_write_coeffs_txb_1d(pcs->ppcs,
719
1.97k
                                                       frame_context,
720
1.97k
                                                       mbmi,
721
1.97k
                                                       ec_writer,
722
1.97k
                                                       blk_ptr,
723
1.97k
                                                       chroma_tx_size,
724
1.97k
                                                       tx_index,
725
1.97k
                                                       intraLumaDir,
726
1.97k
                                                       coeff_buffer,
727
1.97k
                                                       COMPONENT_CHROMA,
728
1.97k
                                                       txb_skip_ctx,
729
1.97k
                                                       dc_sign_ctx,
730
1.97k
                                                       blk_ptr->eob.u[tx_index],
731
1.97k
                                                       ec_ctx);
732
733
        // cr
734
1.97k
        coeff_buffer = (int32_t*)coeff_ptr->v_buffer + ec_ctx->coded_area_sb_uv;
735
1.97k
        txb_skip_ctx = 0;
736
1.97k
        dc_sign_ctx  = 0;
737
738
1.97k
        svt_aom_get_txb_ctx(pcs,
739
1.97k
                            COMPONENT_CHROMA,
740
1.97k
                            cr_dc_sign_level_coeff_na,
741
1.97k
                            uv_x,
742
1.97k
                            uv_y,
743
1.97k
                            bsize_uv,
744
1.97k
                            chroma_tx_size,
745
1.97k
                            &txb_skip_ctx,
746
1.97k
                            &dc_sign_ctx);
747
748
1.97k
        int32_t cul_level_cr = av1_write_coeffs_txb_1d(pcs->ppcs,
749
1.97k
                                                       frame_context,
750
1.97k
                                                       mbmi,
751
1.97k
                                                       ec_writer,
752
1.97k
                                                       blk_ptr,
753
1.97k
                                                       chroma_tx_size,
754
1.97k
                                                       tx_index,
755
1.97k
                                                       intraLumaDir,
756
1.97k
                                                       coeff_buffer,
757
1.97k
                                                       COMPONENT_CHROMA,
758
1.97k
                                                       txb_skip_ctx,
759
1.97k
                                                       dc_sign_ctx,
760
1.97k
                                                       blk_ptr->eob.v[tx_index],
761
1.97k
                                                       ec_ctx);
762
        // Update the cb Dc Sign Level Coeff Neighbor Array
763
1.97k
        uint8_t dc_sign_level_coeff = (uint8_t)cul_level_cb;
764
1.97k
        svt_aom_neighbor_array_unit_mode_write_pu(cb_dc_sign_level_coeff_na,
765
1.97k
                                                  &dc_sign_level_coeff,
766
1.97k
                                                  uv_x,
767
1.97k
                                                  uv_y,
768
1.97k
                                                  tx_width_uv,
769
1.97k
                                                  tx_height_uv,
770
1.97k
                                                  NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
771
        // Update the cr DC Sign Level Coeff Neighbor Array
772
1.97k
        dc_sign_level_coeff = (uint8_t)cul_level_cr;
773
1.97k
        svt_aom_neighbor_array_unit_mode_write_pu(cr_dc_sign_level_coeff_na,
774
1.97k
                                                  &dc_sign_level_coeff,
775
1.97k
                                                  uv_x,
776
1.97k
                                                  uv_y,
777
1.97k
                                                  tx_width_uv,
778
1.97k
                                                  tx_height_uv,
779
1.97k
                                                  NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
780
781
1.97k
        ec_ctx->coded_area_sb_uv += tx_width_uv * tx_height_uv;
782
1.97k
    }
783
1.97k
}
784
785
/************************************
786
******* Av1EncodeTuCoeff
787
**************************************/
788
static EbErrorType av1_encode_coeff_1d(PictureControlSet* pcs, EntropyCodingContext* ec_ctx,
789
                                       FRAME_CONTEXT* frame_context, AomWriter* ec_writer, EcBlkStruct* blk_ptr,
790
                                       uint32_t blk_org_x, uint32_t blk_org_y, uint32_t intraLumaDir,
791
                                       BlockSize luma_bsize, EbPictureBufferDesc* coeff_ptr,
792
                                       NeighborArrayUnit* luma_dc_sign_level_coeff_na,
793
                                       NeighborArrayUnit* cr_dc_sign_level_coeff_na,
794
5.40k
                                       NeighborArrayUnit* cb_dc_sign_level_coeff_na) {
795
5.40k
    EbErrorType       return_error = EB_ErrorNone;
796
5.40k
    MbModeInfo* const mbmi         = ec_ctx->mbmi;
797
5.40k
    const int32_t     is_inter     = is_inter_mode(mbmi->block_mi.mode) || mbmi->block_mi.use_intrabc;
798
5.40k
    if (mbmi->block_mi.tx_depth) {
799
1.97k
        av1_encode_tx_coef_y(pcs,
800
1.97k
                             ec_ctx,
801
1.97k
                             frame_context,
802
1.97k
                             ec_writer,
803
1.97k
                             mbmi,
804
1.97k
                             blk_ptr,
805
1.97k
                             blk_org_x,
806
1.97k
                             blk_org_y,
807
1.97k
                             intraLumaDir,
808
1.97k
                             luma_bsize,
809
1.97k
                             coeff_ptr,
810
1.97k
                             luma_dc_sign_level_coeff_na);
811
812
1.97k
        av1_encode_tx_coef_uv(pcs,
813
1.97k
                              ec_ctx,
814
1.97k
                              frame_context,
815
1.97k
                              ec_writer,
816
1.97k
                              blk_ptr,
817
1.97k
                              blk_org_x,
818
1.97k
                              blk_org_y,
819
1.97k
                              intraLumaDir,
820
1.97k
                              coeff_ptr,
821
1.97k
                              cr_dc_sign_level_coeff_na,
822
1.97k
                              cb_dc_sign_level_coeff_na);
823
3.43k
    } else {
824
        // Transform partitioning free path (except the 128x128 case).
825
        // tx_depth is 0 in this branch.
826
3.43k
        int32_t cul_level_y, cul_level_cb = 0, cul_level_cr = 0;
827
828
3.43k
        const bool     has_uv       = is_chroma_reference(blk_org_y >> 2, blk_org_x >> 2, luma_bsize, 1, 1);
829
3.43k
        const uint8_t  tx_depth     = 0;
830
3.43k
        const uint16_t txb_count    = tx_blocks_per_depth[luma_bsize][tx_depth];
831
3.43k
        const TxSize   tx_size      = tx_depth_to_tx_size[tx_depth][luma_bsize];
832
3.43k
        const int      tx_width     = tx_size_wide[tx_size];
833
3.43k
        const int      tx_height    = tx_size_high[tx_size];
834
3.43k
        const TxSize   tx_size_uv   = av1_get_max_uv_txsize(luma_bsize, 1, 1);
835
3.43k
        const int      tx_width_uv  = tx_size_wide[tx_size_uv];
836
3.43k
        const int      tx_height_uv = tx_size_high[tx_size_uv];
837
        // bsize_uv is only consumed under `has_uv`, but hoisting unconditionally is cheaper than branching twice.
838
3.43k
        const BlockSize bsize_uv = has_uv ? get_plane_block_size(luma_bsize, 1, 1) : 0;
839
6.86k
        for (uint8_t txb_itr = 0; txb_itr < txb_count; txb_itr++) {
840
            // Hoist tx_org + ROUND_UV: reused by up to 7 sites per iteration.
841
3.43k
            const Position org  = tx_org[luma_bsize][is_inter][tx_depth][txb_itr];
842
3.43k
            const uint32_t tx_x = blk_org_x + org.x;
843
3.43k
            const uint32_t tx_y = blk_org_y + org.y;
844
3.43k
            const uint32_t uv_x = ROUND_UV(tx_x) >> 1;
845
3.43k
            const uint32_t uv_y = ROUND_UV(tx_y) >> 1;
846
847
3.43k
            int32_t* coeff_buffer = (int32_t*)coeff_ptr->y_buffer + ec_ctx->coded_area_sb;
848
849
3.43k
            {
850
3.43k
                int16_t txb_skip_ctx = 0;
851
3.43k
                int16_t dc_sign_ctx  = 0;
852
853
3.43k
                svt_aom_get_txb_ctx(pcs,
854
3.43k
                                    COMPONENT_LUMA,
855
3.43k
                                    luma_dc_sign_level_coeff_na,
856
3.43k
                                    tx_x,
857
3.43k
                                    tx_y,
858
3.43k
                                    luma_bsize,
859
3.43k
                                    tx_size,
860
3.43k
                                    &txb_skip_ctx,
861
3.43k
                                    &dc_sign_ctx);
862
863
3.43k
                cul_level_y = av1_write_coeffs_txb_1d(pcs->ppcs,
864
3.43k
                                                      frame_context,
865
3.43k
                                                      mbmi,
866
3.43k
                                                      ec_writer,
867
3.43k
                                                      blk_ptr,
868
3.43k
                                                      tx_size,
869
3.43k
                                                      txb_itr,
870
3.43k
                                                      intraLumaDir,
871
3.43k
                                                      coeff_buffer,
872
3.43k
                                                      COMPONENT_LUMA,
873
3.43k
                                                      txb_skip_ctx,
874
3.43k
                                                      dc_sign_ctx,
875
3.43k
                                                      blk_ptr->eob.y[txb_itr],
876
3.43k
                                                      ec_ctx);
877
3.43k
            }
878
879
3.43k
            if (has_uv) {
880
                // cb
881
3.43k
                coeff_buffer = (int32_t*)coeff_ptr->u_buffer + ec_ctx->coded_area_sb_uv;
882
3.43k
                {
883
3.43k
                    int16_t txb_skip_ctx = 0;
884
3.43k
                    int16_t dc_sign_ctx  = 0;
885
886
3.43k
                    svt_aom_get_txb_ctx(pcs,
887
3.43k
                                        COMPONENT_CHROMA,
888
3.43k
                                        cb_dc_sign_level_coeff_na,
889
3.43k
                                        uv_x,
890
3.43k
                                        uv_y,
891
3.43k
                                        bsize_uv,
892
3.43k
                                        tx_size_uv,
893
3.43k
                                        &txb_skip_ctx,
894
3.43k
                                        &dc_sign_ctx);
895
896
3.43k
                    cul_level_cb = av1_write_coeffs_txb_1d(pcs->ppcs,
897
3.43k
                                                           frame_context,
898
3.43k
                                                           mbmi,
899
3.43k
                                                           ec_writer,
900
3.43k
                                                           blk_ptr,
901
3.43k
                                                           tx_size_uv,
902
3.43k
                                                           txb_itr,
903
3.43k
                                                           intraLumaDir,
904
3.43k
                                                           coeff_buffer,
905
3.43k
                                                           COMPONENT_CHROMA,
906
3.43k
                                                           txb_skip_ctx,
907
3.43k
                                                           dc_sign_ctx,
908
3.43k
                                                           blk_ptr->eob.u[txb_itr],
909
3.43k
                                                           ec_ctx);
910
3.43k
                }
911
912
                // cr
913
3.43k
                coeff_buffer = (int32_t*)coeff_ptr->v_buffer + ec_ctx->coded_area_sb_uv;
914
3.43k
                {
915
3.43k
                    int16_t txb_skip_ctx = 0;
916
3.43k
                    int16_t dc_sign_ctx  = 0;
917
918
3.43k
                    svt_aom_get_txb_ctx(pcs,
919
3.43k
                                        COMPONENT_CHROMA,
920
3.43k
                                        cr_dc_sign_level_coeff_na,
921
3.43k
                                        uv_x,
922
3.43k
                                        uv_y,
923
3.43k
                                        bsize_uv,
924
3.43k
                                        tx_size_uv,
925
3.43k
                                        &txb_skip_ctx,
926
3.43k
                                        &dc_sign_ctx);
927
928
3.43k
                    cul_level_cr = av1_write_coeffs_txb_1d(pcs->ppcs,
929
3.43k
                                                           frame_context,
930
3.43k
                                                           mbmi,
931
3.43k
                                                           ec_writer,
932
3.43k
                                                           blk_ptr,
933
3.43k
                                                           tx_size_uv,
934
3.43k
                                                           txb_itr,
935
3.43k
                                                           intraLumaDir,
936
3.43k
                                                           coeff_buffer,
937
3.43k
                                                           COMPONENT_CHROMA,
938
3.43k
                                                           txb_skip_ctx,
939
3.43k
                                                           dc_sign_ctx,
940
3.43k
                                                           blk_ptr->eob.v[txb_itr],
941
3.43k
                                                           ec_ctx);
942
3.43k
                }
943
3.43k
            }
944
945
            // Update the luma Dc Sign Level Coeff Neighbor Array
946
3.43k
            uint8_t dc_sign_level_coeff = (uint8_t)cul_level_y;
947
3.43k
            svt_aom_neighbor_array_unit_mode_write_pu(luma_dc_sign_level_coeff_na,
948
3.43k
                                                      &dc_sign_level_coeff,
949
3.43k
                                                      tx_x,
950
3.43k
                                                      tx_y,
951
3.43k
                                                      tx_width,
952
3.43k
                                                      tx_height,
953
3.43k
                                                      NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
954
955
            // Update the cb Dc Sign Level Coeff Neighbor Array
956
3.43k
            if (has_uv) {
957
3.43k
                dc_sign_level_coeff = (uint8_t)cul_level_cb;
958
3.43k
                svt_aom_neighbor_array_unit_mode_write_pu(cb_dc_sign_level_coeff_na,
959
3.43k
                                                          &dc_sign_level_coeff,
960
3.43k
                                                          uv_x,
961
3.43k
                                                          uv_y,
962
3.43k
                                                          tx_width_uv,
963
3.43k
                                                          tx_height_uv,
964
3.43k
                                                          NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
965
                // Update the cr DC Sign Level Coeff Neighbor Array
966
3.43k
                dc_sign_level_coeff = (uint8_t)cul_level_cr;
967
3.43k
                svt_aom_neighbor_array_unit_mode_write_pu(cr_dc_sign_level_coeff_na,
968
3.43k
                                                          &dc_sign_level_coeff,
969
3.43k
                                                          uv_x,
970
3.43k
                                                          uv_y,
971
3.43k
                                                          tx_width_uv,
972
3.43k
                                                          tx_height_uv,
973
3.43k
                                                          NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
974
3.43k
                ec_ctx->coded_area_sb_uv += tx_width_uv * tx_height_uv;
975
3.43k
            }
976
3.43k
            ec_ctx->coded_area_sb += tx_width * tx_height;
977
3.43k
        }
978
3.43k
    }
979
5.40k
    return return_error;
980
5.40k
}
981
982
/*********************************************************************
983
* encode_partition_av1
984
*   Encodes the partition
985
*********************************************************************/
986
// Return the number of elements in the partition CDF when
987
// partitioning the (square) block with luma block size of bsize.
988
156k
int32_t svt_aom_partition_cdf_length(BlockSize bsize) {
989
156k
    if (bsize <= BLOCK_8X8) {
990
116k
        return PARTITION_TYPES;
991
116k
    } else if (bsize == BLOCK_128X128) {
992
0
        return EXT_PARTITION_TYPES - 2;
993
39.8k
    } else {
994
39.8k
        return EXT_PARTITION_TYPES;
995
39.8k
    }
996
156k
}
997
998
static void encode_partition_av1(PictureControlSet* pcs, FRAME_CONTEXT* frame_context, AomWriter* ec_writer,
999
                                 BlockSize bsize, PartitionType p, uint32_t blk_org_x, uint32_t blk_org_y,
1000
165k
                                 NeighborArrayUnit* partition_context_na) {
1001
165k
    const int32_t is_partition_point = bsize >= BLOCK_8X8;
1002
1003
165k
    if (!is_partition_point) {
1004
0
        return;
1005
0
    }
1006
1007
165k
    const int32_t hbs      = (mi_size_wide[bsize] << 2) >> 1;
1008
165k
    const int32_t has_rows = (blk_org_y + hbs) < pcs->ppcs->aligned_height;
1009
165k
    const int32_t has_cols = (blk_org_x + hbs) < pcs->ppcs->aligned_width;
1010
1011
165k
    const uint8_t above_byte = *svt_aom_na_top_ptr_pu(partition_context_na, blk_org_x);
1012
165k
    const uint8_t left_byte  = *svt_aom_na_left_ptr_pu(partition_context_na, blk_org_y);
1013
1014
165k
    uint32_t context_index = 0;
1015
1016
165k
    PartitionContextType above_ctx = (above_byte == INVALID_NEIGHBOR_DATA) ? 0 : (PartitionContextType)above_byte;
1017
165k
    PartitionContextType left_ctx  = (left_byte == INVALID_NEIGHBOR_DATA) ? 0 : (PartitionContextType)left_byte;
1018
1019
165k
    const int32_t bsl   = mi_size_wide_log2[bsize] - mi_size_wide_log2[BLOCK_8X8];
1020
165k
    int32_t       above = (above_ctx >> bsl) & 1, left = (left_ctx >> bsl) & 1;
1021
1022
165k
    assert(mi_size_wide_log2[bsize] == mi_size_high_log2[bsize]);
1023
165k
    assert(bsl >= 0);
1024
165k
    assert(p < CDF_SIZE(EXT_PARTITION_TYPES));
1025
1026
165k
    context_index = (left * 2 + above) + bsl * PARTITION_PLOFFSET;
1027
1028
165k
    if (!has_rows && !has_cols) {
1029
393
        assert(p == PARTITION_SPLIT);
1030
393
        return;
1031
393
    }
1032
1033
164k
    if (has_rows && has_cols) {
1034
156k
        aom_write_symbol(
1035
156k
            ec_writer, p, frame_context->partition_cdf[context_index], svt_aom_partition_cdf_length(bsize));
1036
156k
    } else if (!has_rows && has_cols) {
1037
3.88k
        AomCdfProb cdf[CDF_SIZE(2)];
1038
3.88k
        partition_gather_vert_alike(cdf, frame_context->partition_cdf[context_index], bsize);
1039
3.88k
        aom_write_symbol(ec_writer, p == PARTITION_SPLIT, cdf, 2);
1040
4.20k
    } else {
1041
4.20k
        AomCdfProb cdf[CDF_SIZE(2)];
1042
4.20k
        partition_gather_horz_alike(cdf, frame_context->partition_cdf[context_index], bsize);
1043
4.20k
        aom_write_symbol(ec_writer, p == PARTITION_SPLIT, cdf, 2);
1044
4.20k
    }
1045
1046
164k
    return;
1047
165k
}
1048
1049
121k
uint8_t av1_get_skip_context(const MacroBlockD* xd) {
1050
121k
    const MbModeInfo* const above_mi   = xd->above_mbmi;
1051
121k
    const MbModeInfo* const left_mi    = xd->left_mbmi;
1052
121k
    const uint8_t           above_skip = above_mi ? above_mi->block_mi.skip : 0;
1053
121k
    const uint8_t           left_skip  = left_mi ? left_mi->block_mi.skip : 0;
1054
121k
    return above_skip + left_skip;
1055
121k
}
1056
1057
/*********************************************************************
1058
 * encode_skip_coeff_av1
1059
 *   Encodes the skip coefficient flag
1060
 *********************************************************************/
1061
static void encode_skip_coeff_av1(EcBlkStruct* blk_ptr, FRAME_CONTEXT* frame_context, AomWriter* ec_writer,
1062
121k
                                  bool skip_coeff_flag) {
1063
    // TODO: need to code in syntax for segmentation map + skip
1064
121k
    uint8_t ctx = av1_get_skip_context(blk_ptr->av1xd);
1065
121k
    aom_write_symbol(ec_writer, skip_coeff_flag ? 1 : 0, frame_context->skip_cdfs[ctx], 2);
1066
121k
}
1067
1068
/* Get the contexts (left and top) for writing the intra luma mode for key frames. Intended to
1069
 * be used for key frame only. */
1070
242k
void svt_aom_get_kf_y_mode_ctx(const MacroBlockD* xd, uint8_t* above_ctx, uint8_t* left_ctx) {
1071
242k
    PredictionMode intra_luma_left_mode = DC_PRED;
1072
242k
    PredictionMode intra_luma_top_mode  = DC_PRED;
1073
242k
    if (xd->left_available) {
1074
        // When called for key frame, neighbouring mode should be intra
1075
203k
        assert(!is_inter_block(&xd->mi[-1]->block_mi) || is_intrabc_block(&xd->mi[-1]->block_mi));
1076
203k
        intra_luma_left_mode = xd->mi[-1]->block_mi.mode;
1077
203k
    }
1078
242k
    if (xd->up_available) {
1079
        // When called for key frame, neighbouring mode should be intra
1080
202k
        assert(!is_inter_block(&xd->mi[-xd->mi_stride]->block_mi) ||
1081
202k
               is_intrabc_block(&xd->mi[-xd->mi_stride]->block_mi));
1082
202k
        intra_luma_top_mode = xd->mi[-xd->mi_stride]->block_mi.mode;
1083
202k
    }
1084
1085
242k
    *above_ctx = intra_mode_context[intra_luma_top_mode];
1086
242k
    *left_ctx  = intra_mode_context[intra_luma_left_mode];
1087
242k
}
1088
1089
/*********************************************************************
1090
*   Encodes the Intra Luma Mode for a key frame
1091
*********************************************************************/
1092
static void encode_intra_luma_mode_kf_av1(FRAME_CONTEXT* frame_context, AomWriter* ec_writer, MbModeInfo* mbmi,
1093
121k
                                          EcBlkStruct* blk_ptr, BlockSize bsize, uint32_t luma_mode) {
1094
121k
    uint8_t top_context, left_context;
1095
121k
    svt_aom_get_kf_y_mode_ctx(blk_ptr->av1xd, &top_context, &left_context);
1096
121k
    aom_write_symbol(ec_writer, luma_mode, frame_context->kf_y_cdf[top_context][left_context], INTRA_MODES);
1097
1098
121k
    if (bsize >= BLOCK_8X8 && av1_is_directional_mode(mbmi->block_mi.mode)) {
1099
0
        aom_write_symbol(ec_writer,
1100
0
                         mbmi->block_mi.angle_delta[PLANE_TYPE_Y] + MAX_ANGLE_DELTA,
1101
0
                         frame_context->angle_delta_cdf[luma_mode - V_PRED],
1102
0
                         2 * MAX_ANGLE_DELTA + 1);
1103
0
    }
1104
1105
121k
    return;
1106
121k
}
1107
1108
/*********************************************************************
1109
* encode_intra_luma_mode_nonkey_av1
1110
*   Encodes the Intra Luma Mode for non Key frames
1111
*********************************************************************/
1112
static void encode_intra_luma_mode_nonkey_av1(FRAME_CONTEXT* frame_context, AomWriter* ec_writer, MbModeInfo* mbmi,
1113
0
                                              BlockSize bsize, uint32_t luma_mode) {
1114
0
    aom_write_symbol(ec_writer, luma_mode, frame_context->y_mode_cdf[eb_size_group_lookup[bsize]], INTRA_MODES);
1115
1116
0
    if (bsize >= BLOCK_8X8 && av1_is_directional_mode(mbmi->block_mi.mode)) {
1117
0
        aom_write_symbol(ec_writer,
1118
0
                         mbmi->block_mi.angle_delta[PLANE_TYPE_Y] + MAX_ANGLE_DELTA,
1119
0
                         frame_context->angle_delta_cdf[luma_mode - V_PRED],
1120
0
                         2 * MAX_ANGLE_DELTA + 1);
1121
0
    }
1122
1123
0
    return;
1124
0
}
1125
1126
0
static void write_cfl_alphas(FRAME_CONTEXT* const ec_ctx, int32_t idx, int32_t joint_sign, AomWriter* w) {
1127
0
    aom_write_symbol(w, joint_sign, ec_ctx->cfl_sign_cdf, CFL_JOINT_SIGNS);
1128
    // Magnitudes are only signaled for nonzero codes.
1129
0
    if (CFL_SIGN_U(joint_sign) != CFL_SIGN_ZERO) {
1130
0
        AomCdfProb* cdf_u = ec_ctx->cfl_alpha_cdf[CFL_CONTEXT_U(joint_sign)];
1131
0
        aom_write_symbol(w, CFL_IDX_U(idx), cdf_u, CFL_ALPHABET_SIZE);
1132
0
    }
1133
0
    if (CFL_SIGN_V(joint_sign) != CFL_SIGN_ZERO) {
1134
0
        AomCdfProb* cdf_v = ec_ctx->cfl_alpha_cdf[CFL_CONTEXT_V(joint_sign)];
1135
0
        aom_write_symbol(w, CFL_IDX_V(idx), cdf_v, CFL_ALPHABET_SIZE);
1136
0
    }
1137
0
}
1138
1139
/*********************************************************************
1140
* encode_intra_chroma_mode_av1
1141
*   Encodes the Intra Chroma Mode
1142
*********************************************************************/
1143
static void encode_intra_chroma_mode_av1(FRAME_CONTEXT* frame_context, AomWriter* ec_writer, MbModeInfo* mbmi,
1144
                                         BlockSize bsize, uint32_t luma_mode, uint32_t chroma_mode,
1145
121k
                                         uint8_t cflAllowed) {
1146
121k
    aom_write_symbol(
1147
121k
        ec_writer, chroma_mode, frame_context->uv_mode_cdf[cflAllowed][luma_mode], UV_INTRA_MODES - !cflAllowed);
1148
1149
121k
    if (chroma_mode == UV_CFL_PRED) {
1150
0
        write_cfl_alphas(frame_context, mbmi->block_mi.cfl_alpha_idx, mbmi->block_mi.cfl_alpha_signs, ec_writer);
1151
0
    }
1152
1153
121k
    if (bsize >= BLOCK_8X8 && av1_is_directional_mode(get_uv_mode(mbmi->block_mi.uv_mode))) {
1154
0
        aom_write_symbol(ec_writer,
1155
0
                         mbmi->block_mi.angle_delta[PLANE_TYPE_UV] + MAX_ANGLE_DELTA,
1156
0
                         frame_context->angle_delta_cdf[chroma_mode - V_PRED],
1157
0
                         2 * MAX_ANGLE_DELTA + 1);
1158
0
    }
1159
1160
121k
    return;
1161
121k
}
1162
1163
121k
uint8_t av1_get_skip_mode_context(const MacroBlockD* xd) {
1164
121k
    const MbModeInfo* const above_mi        = xd->above_mbmi;
1165
121k
    const MbModeInfo* const left_mi         = xd->left_mbmi;
1166
121k
    const int               above_skip_mode = above_mi ? above_mi->block_mi.skip_mode : 0;
1167
121k
    const int               left_skip_mode  = left_mi ? left_mi->block_mi.skip_mode : 0;
1168
121k
    return above_skip_mode + left_skip_mode;
1169
121k
}
1170
1171
/*********************************************************************
1172
 * encode_skip_mode_av1
1173
 *   Encodes the skip Mode flag
1174
 *********************************************************************/
1175
static void encode_skip_mode_av1(const EcBlkStruct* blk_ptr, FRAME_CONTEXT* frame_context, AomWriter* ec_writer,
1176
0
                                 bool skip_mode_flag) {
1177
    // TODO: not coded in syntax for skip mode/ref-frame/global-mv in segmentation map
1178
0
    const uint8_t context_index = av1_get_skip_mode_context(blk_ptr->av1xd);
1179
1180
0
    aom_write_symbol(ec_writer, skip_mode_flag ? 1 : 0, frame_context->skip_mode_cdfs[context_index], 2);
1181
0
}
1182
1183
/*******************************************************************************
1184
* The mode info data structure has a one element border above and to the
1185
* left of the entries corresponding to real macroblocks.
1186
* The prediction flags in these dummy entries are initialized to 0.
1187
* 0 - inter/inter, inter/--, --/inter, --/--
1188
* 1 - intra/inter, inter/intra
1189
* 2 - intra/--, --/intra
1190
* 3 - intra/intra
1191
 ******************************************************************************/
1192
121k
uint8_t svt_av1_get_intra_inter_context(const MacroBlockD* xd) {
1193
121k
    const MbModeInfo* const above_mbmi = xd->above_mbmi;
1194
121k
    const MbModeInfo* const left_mbmi  = xd->left_mbmi;
1195
121k
    const int               has_above  = xd->up_available;
1196
121k
    const int               has_left   = xd->left_available;
1197
1198
121k
    if (has_above && has_left) { // both edges available
1199
86.1k
        const int above_intra = !is_inter_block(&above_mbmi->block_mi);
1200
86.1k
        const int left_intra  = !is_inter_block(&left_mbmi->block_mi);
1201
18.4E
        return left_intra && above_intra ? 3 : left_intra || above_intra;
1202
86.1k
    } else if (has_above || has_left) { // one edge available
1203
30.3k
        return 2 * !is_inter_block(has_above ? &above_mbmi->block_mi : &left_mbmi->block_mi);
1204
30.3k
    } else {
1205
4.50k
        return 0;
1206
4.50k
    }
1207
121k
}
1208
1209
/*********************************************************************
1210
 * encode_pred_mode_av1
1211
 *   Encodes the Prediction Mode
1212
 *********************************************************************/
1213
static void write_is_inter(const EcBlkStruct* blk_ptr, FRAME_CONTEXT* frame_context, AomWriter* ec_writer,
1214
0
                           int32_t is_inter) {
1215
0
    const uint8_t ctx = svt_av1_get_intra_inter_context(blk_ptr->av1xd);
1216
0
    aom_write_symbol(ec_writer, is_inter, frame_context->intra_inter_cdf[ctx], 2);
1217
0
}
1218
1219
//****************************************************************************************************//
1220
1221
/*********************************************************************
1222
* svt_aom_motion_mode_allowed
1223
*   checks the motion modes that are allowed for the current block
1224
*********************************************************************/
1225
MotionMode svt_aom_motion_mode_allowed(const PictureControlSet* pcs, uint16_t num_proj_ref,
1226
                                       uint32_t overlappable_neighbors, const BlockSize bsize, MvReferenceFrame rf0,
1227
0
                                       MvReferenceFrame rf1, PredictionMode mode) {
1228
0
    FrameHeader* frm_hdr = &pcs->ppcs->frm_hdr;
1229
0
    if (!frm_hdr->is_motion_mode_switchable) {
1230
0
        return SIMPLE_TRANSLATION;
1231
0
    }
1232
1233
0
    if (frm_hdr->force_integer_mv == 0) {
1234
0
        const TransformationType gm_type = pcs->ppcs->global_motion[rf0].wmtype;
1235
0
        if (is_global_mv_block(mode, bsize, gm_type)) {
1236
0
            return SIMPLE_TRANSLATION;
1237
0
        }
1238
0
    }
1239
0
    if (is_motion_variation_allowed_bsize(bsize) && is_inter_singleref_mode(mode) && rf1 != INTRA_FRAME &&
1240
0
        !(rf1 > INTRA_FRAME)) // is_motion_variation_allowed_compound
1241
0
    {
1242
0
        if (overlappable_neighbors == 0) {
1243
0
            return SIMPLE_TRANSLATION;
1244
0
        }
1245
1246
0
        if (frm_hdr->allow_warped_motion &&
1247
            /* TODO(JS): when scale is added, put: !av1_is_scaled(&(xd->block_refs[0]->sf)) && */
1248
0
            num_proj_ref >= 1) {
1249
0
            if (frm_hdr->force_integer_mv) {
1250
0
                return OBMC_CAUSAL;
1251
0
            }
1252
0
            return WARPED_CAUSAL;
1253
0
        }
1254
0
        return OBMC_CAUSAL;
1255
0
    } else {
1256
0
        return SIMPLE_TRANSLATION;
1257
0
    }
1258
0
}
1259
1260
/*********************************************************************
1261
* write_motion_mode
1262
*   Encodes the Motion Mode (obmc or warped)
1263
*********************************************************************/
1264
static void write_motion_mode(FRAME_CONTEXT* frame_context, AomWriter* ec_writer, BlockSize bsize, MbModeInfo* mbmi,
1265
                              MotionMode motion_mode, MvReferenceFrame rf0, MvReferenceFrame rf1, EcBlkStruct* blk_ptr,
1266
0
                              PictureControlSet* pcs) {
1267
0
    MotionMode last_motion_mode_allowed = svt_aom_motion_mode_allowed(
1268
0
        pcs, mbmi->block_mi.num_proj_ref, blk_ptr->overlappable_neighbors, bsize, rf0, rf1, mbmi->block_mi.mode);
1269
0
    switch (last_motion_mode_allowed) {
1270
0
    case SIMPLE_TRANSLATION:
1271
0
        break;
1272
0
    case OBMC_CAUSAL:
1273
0
        aom_write_symbol(ec_writer, motion_mode == OBMC_CAUSAL, frame_context->obmc_cdf[bsize], 2);
1274
0
        break;
1275
0
    default:
1276
0
        aom_write_symbol(ec_writer, motion_mode, frame_context->motion_mode_cdf[bsize], MOTION_MODES);
1277
0
    }
1278
1279
0
    return;
1280
0
}
1281
1282
//****************************************************************************************************//
1283
1284
4.53k
EbErrorType svt_aom_encode_slice_finish(EntropyCoder* ec) {
1285
4.53k
    EbErrorType return_error = EB_ErrorNone;
1286
1287
4.53k
    aom_stop_encode(&ec->ec_writer);
1288
1289
4.53k
    return return_error;
1290
4.53k
}
1291
1292
4.53k
EbErrorType svt_aom_reset_entropy_coder(EncodeContext* enc_ctx, EntropyCoder* ec, uint32_t qp, SliceType slice_type) {
1293
4.53k
    EbErrorType return_error = EB_ErrorNone;
1294
1295
4.53k
    (void)enc_ctx;
1296
4.53k
    (void)slice_type;
1297
4.53k
    svt_av1_default_coef_probs(ec->fc, qp);
1298
4.53k
    svt_aom_init_mode_probs(ec->fc);
1299
1300
4.53k
    return return_error;
1301
4.53k
}
1302
1303
4.53k
static void entropy_tile_info_dctor(EbPtr p) {
1304
4.53k
    EntropyTileInfo* obj = (EntropyTileInfo*)p;
1305
4.53k
    EB_DELETE(obj->ec);
1306
4.53k
}
1307
1308
4.53k
EbErrorType svt_aom_entropy_tile_info_ctor(EntropyTileInfo* eti, uint32_t buf_size) {
1309
4.53k
    EbErrorType return_error = EB_ErrorNone;
1310
4.53k
    eti->dctor               = entropy_tile_info_dctor;
1311
4.53k
    EB_NEW(eti->ec, svt_aom_entropy_coder_ctor, buf_size);
1312
4.53k
    eti->entropy_coding_tile_done = false;
1313
4.53k
    return return_error;
1314
4.53k
}
1315
1316
2.15k
static void bitstream_dctor(EbPtr p) {
1317
2.15k
    Bitstream* obj = (Bitstream*)p;
1318
2.15k
    EB_DELETE(obj->output_bitstream_ptr);
1319
2.15k
}
1320
1321
2.15k
EbErrorType svt_aom_bitstream_ctor(Bitstream* bitstream_ptr, uint32_t buffer_size) {
1322
2.15k
    bitstream_ptr->dctor = bitstream_dctor;
1323
2.15k
    EB_NEW(bitstream_ptr->output_bitstream_ptr, svt_aom_output_bitstream_unit_ctor, buffer_size);
1324
2.15k
    return EB_ErrorNone;
1325
2.15k
}
1326
1327
430
void svt_aom_bitstream_reset(Bitstream* bitstream_ptr) {
1328
430
    svt_aom_output_bitstream_reset(bitstream_ptr->output_bitstream_ptr);
1329
430
}
1330
1331
860
int svt_aom_bitstream_get_bytes_count(const Bitstream* bitstream_ptr) {
1332
860
    const OutputBitstreamUnit* unit = bitstream_ptr->output_bitstream_ptr;
1333
860
    return (int)(unit->buffer_av1 - unit->buffer_begin_av1);
1334
860
}
1335
1336
430
void svt_aom_bitstream_copy(const Bitstream* bitstream_ptr, void* dest, int size) {
1337
430
    const OutputBitstreamUnit* unit = bitstream_ptr->output_bitstream_ptr;
1338
430
    svt_memcpy(dest, unit->buffer_begin_av1, size);
1339
430
}
1340
1341
4.53k
static void entropy_coder_dctor(EbPtr p) {
1342
4.53k
    EntropyCoder*        obj                  = (EntropyCoder*)p;
1343
4.53k
    OutputBitstreamUnit* output_bitstream_ptr = (OutputBitstreamUnit*)obj->ec_output_bitstream_ptr;
1344
4.53k
    EB_DELETE(output_bitstream_ptr);
1345
    // EC buffer is owned by OutputBitstreamUnit and freed above; just NULL out.
1346
4.53k
    obj->ec_writer.ec.buf = NULL;
1347
4.53k
    obj->ec_writer.ec.ptr = NULL;
1348
4.53k
    EB_FREE(obj->fc);
1349
4.53k
}
1350
1351
4.53k
EbErrorType svt_aom_entropy_coder_ctor(EntropyCoder* ec, uint32_t buffer_size) {
1352
4.53k
    OutputBitstreamUnit* output_bitstream_ptr;
1353
1354
4.53k
    ec->dctor = entropy_coder_dctor;
1355
1356
4.53k
    EB_MALLOC_OBJECT(ec->fc);
1357
1358
4.53k
    EB_NEW(output_bitstream_ptr, svt_aom_output_bitstream_unit_ctor, buffer_size);
1359
4.53k
    ec->ec_output_bitstream_ptr = output_bitstream_ptr;
1360
1361
    // EC does not allocate its own buffer; it borrows from OutputBitstreamUnit
1362
    // via aom_start_encode() each frame.
1363
4.53k
    svt_od_ec_enc_init(&ec->ec_writer.ec);
1364
1365
4.53k
    return EB_ErrorNone;
1366
4.53k
}
1367
1368
//*******************************************************************************************//
1369
//*******************************************************************************************//
1370
//*******************************************************************************************//
1371
//*******************************************************************************************//
1372
// aom_integer.c
1373
static const size_t   k_maximum_leb_128_size  = 8;
1374
static const uint64_t k_maximum_leb_128_value = 0xFFFFFFFFFFFFFF; // 2 ^ 56 - 1
1375
1376
2.15k
size_t svt_aom_uleb_size_in_bytes(uint64_t value) {
1377
2.15k
    size_t size = 0;
1378
2.82k
    do {
1379
2.82k
        ++size;
1380
2.82k
    } while ((value >>= 7) != 0);
1381
2.15k
    return size;
1382
2.15k
}
1383
1384
1.29k
int32_t svt_aom_uleb_encode(uint64_t value, size_t available, uint8_t* coded_value, size_t* coded_size) {
1385
1.29k
    const size_t leb_size = svt_aom_uleb_size_in_bytes(value);
1386
1.29k
    if (value > k_maximum_leb_128_value || leb_size > k_maximum_leb_128_size || leb_size > available || !coded_value ||
1387
1.29k
        !coded_size) {
1388
0
        return -1;
1389
0
    }
1390
1391
2.91k
    for (size_t i = 0; i < leb_size; ++i) {
1392
1.62k
        uint8_t byte = value & 0x7f;
1393
1.62k
        value >>= 7;
1394
1395
1.62k
        if (value != 0) {
1396
336
            byte |= 0x80; // Signal that more bytes follow.
1397
336
        }
1398
1399
1.62k
        *(coded_value + i) = byte;
1400
1.62k
    }
1401
1402
1.29k
    *coded_size = leb_size;
1403
1.29k
    return 0;
1404
1.29k
}
1405
1406
860
int32_t svt_aom_wb_is_byte_aligned(const AomWriteBitBuffer* wb) {
1407
860
    return (wb->bit_offset % CHAR_BIT == 0);
1408
860
}
1409
1410
3.86k
uint32_t svt_aom_wb_bytes_written(const AomWriteBitBuffer* wb) {
1411
3.86k
    return wb->bit_offset / CHAR_BIT + (wb->bit_offset % CHAR_BIT > 0);
1412
3.86k
}
1413
1414
101k
INLINE static void svt_aom_wb_write_bit_inlined(AomWriteBitBuffer* wb, int32_t bit) {
1415
101k
    const int32_t off = (int32_t)wb->bit_offset;
1416
101k
    const int32_t p   = off / CHAR_BIT;
1417
101k
    const int32_t q   = CHAR_BIT - 1 - off % CHAR_BIT;
1418
101k
    if (q == CHAR_BIT - 1) {
1419
        // zero next char and write bit
1420
14.1k
        wb->bit_buffer[p] = (uint8_t)(bit << q);
1421
87.7k
    } else {
1422
87.7k
        wb->bit_buffer[p] &= ~(1 << q);
1423
87.7k
        wb->bit_buffer[p] |= bit << q;
1424
87.7k
    }
1425
101k
    wb->bit_offset = off + 1;
1426
101k
}
1427
1428
19.8k
INLINE static void svt_aom_wb_write_literal_inlined(AomWriteBitBuffer* wb, int32_t data, int32_t bits) {
1429
19.8k
    int32_t bit;
1430
94.9k
    for (bit = bits - 1; bit >= 0; bit--) {
1431
75.1k
        svt_aom_wb_write_bit(wb, (data >> bit) & 1);
1432
75.1k
    }
1433
19.8k
}
1434
1435
101k
void NOINLINE svt_aom_wb_write_bit(AomWriteBitBuffer* wb, int32_t bit) {
1436
101k
    svt_aom_wb_write_bit_inlined(wb, bit);
1437
101k
}
1438
1439
19.8k
void NOINLINE svt_aom_wb_write_literal(AomWriteBitBuffer* wb, int32_t data, int32_t bits) {
1440
19.8k
    svt_aom_wb_write_literal_inlined(wb, data, bits);
1441
19.8k
}
1442
1443
0
void NOINLINE svt_aom_wb_write_inv_signed_literal(AomWriteBitBuffer* wb, int32_t data, int32_t bits) {
1444
0
    svt_aom_wb_write_literal_inlined(wb, data, bits + 1);
1445
0
}
1446
1447
//*******************************************************************************************//
1448
1449
static void write_inter_mode(FRAME_CONTEXT* frame_context, AomWriter* ec_writer, PredictionMode mode,
1450
0
                             const int16_t mode_ctx, uint32_t blk_org_x, uint32_t blk_org_y) {
1451
0
    (void)blk_org_x;
1452
0
    (void)blk_org_y;
1453
0
    int16_t newmv_ctx = mode_ctx & NEWMV_CTX_MASK;
1454
0
    assert(newmv_ctx < NEWMV_MODE_CONTEXTS);
1455
0
    aom_write_symbol(ec_writer, mode != NEWMV, frame_context->newmv_cdf[newmv_ctx], 2);
1456
1457
0
    if (mode != NEWMV) {
1458
0
        const int16_t zeromv_ctx = (mode_ctx >> GLOBALMV_OFFSET) & GLOBALMV_CTX_MASK;
1459
0
        aom_write_symbol(ec_writer, mode != GLOBALMV, frame_context->zeromv_cdf[zeromv_ctx], 2);
1460
1461
0
        if (mode != GLOBALMV) {
1462
0
            int16_t refmv_ctx = (mode_ctx >> REFMV_OFFSET) & REFMV_CTX_MASK;
1463
0
            assert(refmv_ctx < REFMV_MODE_CONTEXTS);
1464
0
            aom_write_symbol(ec_writer, mode != NEARESTMV, frame_context->refmv_cdf[refmv_ctx], 2);
1465
0
        }
1466
0
    }
1467
0
}
1468
1469
//extern INLINE int8_t av1_ref_frame_type(const MvReferenceFrame *const rf);
1470
static void write_drl_idx(FRAME_CONTEXT* frame_context, AomWriter* ec_writer, MbModeInfo* mbmi,
1471
1472
0
                          EcBlkStruct* blk_ptr) {
1473
0
    const int32_t new_mv = mbmi->block_mi.mode == NEWMV || mbmi->block_mi.mode == NEW_NEWMV;
1474
0
    if (new_mv) {
1475
0
        int32_t idx;
1476
0
        for (idx = 0; idx < 2; ++idx) {
1477
0
            if (blk_ptr->drl_ctx[idx] != -1) {
1478
0
                uint8_t drl_ctx = (uint8_t)blk_ptr->drl_ctx[idx];
1479
1480
0
                aom_write_symbol(ec_writer, blk_ptr->drl_index != idx, frame_context->drl_cdf[drl_ctx], 2);
1481
1482
0
                if (blk_ptr->drl_index == idx) {
1483
0
                    return;
1484
0
                }
1485
0
            }
1486
0
        }
1487
0
        return;
1488
0
    }
1489
1490
0
    if (have_nearmv_in_inter_mode(mbmi->block_mi.mode)) {
1491
0
        int32_t idx;
1492
        // TODO(jingning): Temporary solution to compensate the NEARESTMV offset.
1493
0
        for (idx = 1; idx < 3; ++idx) {
1494
0
            if (blk_ptr->drl_ctx_near[idx - 1] != -1) {
1495
0
                uint8_t drl_ctx = (uint8_t)blk_ptr->drl_ctx_near[idx - 1];
1496
1497
0
                aom_write_symbol(ec_writer, blk_ptr->drl_index != (idx - 1), frame_context->drl_cdf[drl_ctx], 2);
1498
1499
0
                if (blk_ptr->drl_index == (idx - 1)) {
1500
0
                    return;
1501
0
                }
1502
0
            }
1503
0
        }
1504
0
        return;
1505
0
    }
1506
0
}
1507
1508
0
static void encode_mv_component(AomWriter* w, int32_t comp, NmvComponent* mvcomp, MvSubpelPrecision precision) {
1509
0
    int32_t       offset;
1510
0
    const int32_t sign     = comp < 0;
1511
0
    const int32_t mag      = sign ? -comp : comp;
1512
0
    const int32_t mv_class = svt_av1_get_mv_class(mag - 1, &offset);
1513
0
    const int32_t d        = offset >> 3; // int32_t mv data
1514
0
    const int32_t fr       = (offset >> 1) & 3; // fractional mv data
1515
0
    const int32_t hp       = offset & 1; // high precision mv data
1516
1517
0
    assert(comp != 0);
1518
1519
    // Sign
1520
0
    aom_write_symbol(w, sign, mvcomp->sign_cdf, 2);
1521
1522
    // Class
1523
0
    aom_write_symbol(w, mv_class, mvcomp->classes_cdf, MV_CLASSES);
1524
1525
    // Integer bits
1526
0
    if (mv_class == MV_CLASS_0) {
1527
0
        aom_write_symbol(w, d, mvcomp->class0_cdf, CLASS0_SIZE);
1528
0
    } else {
1529
0
        int32_t       i;
1530
0
        const int32_t n = mv_class + CLASS0_BITS - 1; // number of bits
1531
0
        for (i = 0; i < n; ++i) {
1532
0
            aom_write_symbol(w, (d >> i) & 1, mvcomp->bits_cdf[i], 2);
1533
0
        }
1534
0
    }
1535
    // Fractional bits
1536
0
    if (precision > MV_SUBPEL_NONE) {
1537
0
        aom_write_symbol(w, fr, mv_class == MV_CLASS_0 ? mvcomp->class0_fp_cdf[d] : mvcomp->fp_cdf, MV_FP_SIZE);
1538
0
    }
1539
1540
    // High precision bit
1541
0
    if (precision > MV_SUBPEL_LOW_PRECISION) {
1542
0
        aom_write_symbol(w, hp, mv_class == MV_CLASS_0 ? mvcomp->class0_hp_cdf : mvcomp->hp_cdf, 2);
1543
0
    }
1544
0
}
1545
1546
// can't mark the parameter as const due to MSVC not supporting c99 fully.
1547
#ifdef _MSC_VER
1548
static MvJointType av1_get_mv_joint_diff(const int32_t diff[2]) {
1549
#else
1550
0
static MvJointType av1_get_mv_joint_diff(const int32_t diff[const 2]) {
1551
0
#endif
1552
0
    if (diff[0] == 0) {
1553
0
        return diff[1] == 0 ? MV_JOINT_ZERO : MV_JOINT_HNZVZ;
1554
0
    }
1555
0
    return diff[1] == 0 ? MV_JOINT_HZVNZ : MV_JOINT_HNZVNZ;
1556
0
}
1557
1558
void svt_av1_encode_mv(PictureParentControlSet* pcs, AomWriter* ec_writer, const Mv* mv, const Mv* ref,
1559
0
                       NmvContext* mvctx, int32_t usehp) {
1560
    // The y-component (row component) of the MV is coded first
1561
0
    int32_t           diff[2] = {mv->y - ref->y, mv->x - ref->x};
1562
0
    const MvJointType j       = av1_get_mv_joint_diff(diff);
1563
1564
0
    if (pcs->frm_hdr.force_integer_mv) {
1565
0
        usehp = MV_SUBPEL_NONE;
1566
0
    }
1567
0
    aom_write_symbol(ec_writer, j, mvctx->joints_cdf, MV_JOINTS);
1568
0
    if (mv_joint_vertical(j)) {
1569
0
        encode_mv_component(ec_writer, diff[0], &mvctx->comps[0], (MvSubpelPrecision)usehp);
1570
0
    }
1571
1572
0
    if (mv_joint_horizontal(j)) {
1573
0
        encode_mv_component(ec_writer, diff[1], &mvctx->comps[1], (MvSubpelPrecision)usehp);
1574
0
    }
1575
1576
    // If auto_mv_step_size is enabled then keep track of the largest
1577
    // motion vector component used.
1578
    //if (cpi->sf.mv.auto_mv_step_size) {
1579
    //    uint32_t maxv = AOMMAX(abs(mv->row), abs(mv->col)) >> 3;
1580
    //    cpi->max_mv_magnitude = AOMMAX(maxv, cpi->max_mv_magnitude);
1581
    //}
1582
0
}
1583
1584
//Returns a context number for the given MB prediction signal
1585
0
static InterpFilter svt_aom_get_ref_filter_type(const BlockModeInfo* ref_mbmi, int dir, MvReferenceFrame ref_frame) {
1586
0
    return ((ref_mbmi->ref_frame[0] == ref_frame || ref_mbmi->ref_frame[1] == ref_frame)
1587
0
                ? av1_extract_interp_filter(ref_mbmi->interp_filters, dir & 0x01)
1588
0
                : SWITCHABLE_FILTERS);
1589
0
}
1590
1591
/* Get the context for the interpolation filter when SWITCHABLE filter is specified
1592
at the frame level.  Used for computing rate and for entropy coding. */
1593
int svt_aom_get_pred_context_switchable_interp(MvReferenceFrame rf0, MvReferenceFrame rf1, const MacroBlockD* xd,
1594
0
                                               int dir) {
1595
    /* When calling the function from MD, the current MBMI may not be updated yet, so pass
1596
       the ref frames instead of getting them from the current mbmi (as you could below):
1597
1598
            const MbModeInfo* const mbmi = &xd->mi[0]->mbmi;
1599
            const int ctx_offset = (mbmi->block_mi.ref_frame[1] > INTRA_FRAME) * INTER_FILTER_COMP_OFFSET;
1600
            assert(dir == 0 || dir == 1);
1601
            const MvReferenceFrame ref_frame = mbmi->block_mi.ref_frame[0];
1602
    */
1603
1604
0
    const int32_t ctx_offset = (rf1 > INTRA_FRAME) * INTER_FILTER_COMP_OFFSET;
1605
0
    assert(dir == 0 || dir == 1);
1606
0
    MvReferenceFrame ref_frame = rf0;
1607
1608
    // Note:
1609
    // The mode info data structure has a one element border above and to the
1610
    // left of the entries corresponding to real macroblocks.
1611
    // The prediction flags in these dummy entries are initialized to 0.
1612
0
    int filter_type_ctx = ctx_offset + (dir & 0x01) * INTER_FILTER_DIR_OFFSET;
1613
0
    int left_type       = SWITCHABLE_FILTERS;
1614
0
    int above_type      = SWITCHABLE_FILTERS;
1615
1616
0
    if (xd->left_available) {
1617
0
        left_type = svt_aom_get_ref_filter_type(&xd->mi[-1]->block_mi, dir, ref_frame);
1618
0
    }
1619
1620
0
    if (xd->up_available) {
1621
0
        above_type = svt_aom_get_ref_filter_type(&xd->mi[-xd->mi_stride]->block_mi, dir, ref_frame);
1622
0
    }
1623
1624
0
    if (left_type == above_type) {
1625
0
        filter_type_ctx += left_type;
1626
0
    } else if (left_type == SWITCHABLE_FILTERS) {
1627
0
        assert(above_type != SWITCHABLE_FILTERS);
1628
0
        filter_type_ctx += above_type;
1629
0
    } else if (above_type == SWITCHABLE_FILTERS) {
1630
0
        assert(left_type != SWITCHABLE_FILTERS);
1631
0
        filter_type_ctx += left_type;
1632
0
    } else {
1633
0
        filter_type_ctx += SWITCHABLE_FILTERS;
1634
0
    }
1635
0
    return filter_type_ctx;
1636
0
}
1637
1638
int svt_aom_is_nontrans_global_motion(const BlockModeInfo* block_mi, const BlockSize bsize,
1639
0
                                      PictureParentControlSet* pcs) {
1640
    // First check if all modes are GLOBALMV
1641
0
    if (block_mi->mode != GLOBALMV && block_mi->mode != GLOBAL_GLOBALMV) {
1642
0
        return 0;
1643
0
    }
1644
1645
0
    if (MIN(mi_size_wide[bsize], mi_size_high[bsize]) < 2) {
1646
0
        return 0;
1647
0
    }
1648
0
    const uint8_t is_compound = is_inter_compound_mode(block_mi->mode);
1649
    // Now check if all global motion is non translational
1650
0
    for (int ref = 0; ref < 1 + is_compound; ++ref) {
1651
0
        if (pcs->global_motion[block_mi->ref_frame[ref]].wmtype == TRANSLATION) {
1652
0
            return 0;
1653
0
        }
1654
0
    }
1655
0
    return 1;
1656
0
}
1657
1658
0
static int av1_is_interp_needed(const BlockModeInfo* block_mi, const BlockSize bsize, PictureParentControlSet* pcs) {
1659
0
    if (block_mi->skip_mode) {
1660
0
        return 0;
1661
0
    }
1662
1663
0
    if (block_mi->motion_mode == WARPED_CAUSAL) {
1664
0
        return 0;
1665
0
    }
1666
1667
0
    if (svt_aom_is_nontrans_global_motion(block_mi, bsize, pcs)) {
1668
0
        return 0;
1669
0
    }
1670
1671
0
    return 1;
1672
0
}
1673
1674
static void write_mb_interp_filter(BlockSize bsize, MvReferenceFrame rf0, MvReferenceFrame rf1,
1675
                                   PictureParentControlSet* pcs, AomWriter* ec_writer, MbModeInfo* mbmi,
1676
0
                                   EcBlkStruct* blk_ptr, EntropyCoder* ec) {
1677
0
    FrameHeader* const frm_hdr = &pcs->frm_hdr;
1678
1679
0
    if (frm_hdr->interpolation_filter != SWITCHABLE || !av1_is_interp_needed(&mbmi->block_mi, bsize, pcs)) {
1680
0
        return;
1681
0
    }
1682
1683
0
    const int max_dir = pcs->scs->seq_header.enable_dual_filter ? 2 : 1;
1684
0
    for (int dir = 0; dir < max_dir; ++dir) {
1685
0
        const int    ctx    = svt_aom_get_pred_context_switchable_interp(rf0, rf1, blk_ptr->av1xd, dir);
1686
0
        InterpFilter filter = av1_extract_interp_filter(mbmi->block_mi.interp_filters, dir);
1687
0
        assert(ctx < SWITCHABLE_FILTER_CONTEXTS);
1688
0
        assert(filter < CDF_SIZE(SWITCHABLE_FILTERS));
1689
0
        aom_write_symbol(ec_writer, filter, ec->fc->switchable_interp_cdf[ctx], SWITCHABLE_FILTERS);
1690
0
    }
1691
0
}
1692
1693
static void write_inter_compound_mode(FRAME_CONTEXT* frame_context, AomWriter* ec_writer, PredictionMode mode,
1694
0
                                      const int16_t mode_ctx) {
1695
0
    assert(is_inter_compound_mode(mode));
1696
0
    aom_write_symbol(
1697
0
        ec_writer, INTER_COMPOUND_OFFSET(mode), frame_context->inter_compound_mode_cdf[mode_ctx], INTER_COMPOUND_MODES);
1698
0
}
1699
1700
int svt_aom_get_reference_mode_context_new(const MacroBlockD* xd);
1701
1702
0
AomCdfProb* svt_aom_get_reference_mode_cdf(const MacroBlockD* xd) {
1703
0
    return xd->tile_ctx->comp_inter_cdf[svt_aom_get_reference_mode_context_new(xd)];
1704
0
}
1705
1706
int svt_aom_get_comp_reference_type_context_new(const MacroBlockD* xd);
1707
1708
// == Uni-directional contexts ==
1709
1710
int svt_av1_get_pred_context_uni_comp_ref_p(const MacroBlockD* xd);
1711
1712
int svt_av1_get_pred_context_uni_comp_ref_p1(const MacroBlockD* xd);
1713
1714
int svt_av1_get_pred_context_uni_comp_ref_p2(const MacroBlockD* xd);
1715
1716
0
AomCdfProb* svt_aom_get_comp_reference_type_cdf(const MacroBlockD* xd) {
1717
0
    const int pred_context = svt_aom_get_comp_reference_type_context_new(xd);
1718
0
    return xd->tile_ctx->comp_ref_type_cdf[pred_context];
1719
0
}
1720
1721
0
AomCdfProb* svt_aom_get_pred_cdf_uni_comp_ref_p(const MacroBlockD* xd) {
1722
0
    const int pred_context = svt_av1_get_pred_context_uni_comp_ref_p(xd);
1723
0
    return xd->tile_ctx->uni_comp_ref_cdf[pred_context][0];
1724
0
}
1725
1726
0
AomCdfProb* svt_aom_get_pred_cdf_uni_comp_ref_p1(const MacroBlockD* xd) {
1727
0
    const int pred_context = svt_av1_get_pred_context_uni_comp_ref_p1(xd);
1728
0
    return xd->tile_ctx->uni_comp_ref_cdf[pred_context][1];
1729
0
}
1730
1731
0
AomCdfProb* svt_aom_get_pred_cdf_uni_comp_ref_p2(const MacroBlockD* xd) {
1732
0
    const int pred_context = svt_av1_get_pred_context_uni_comp_ref_p2(xd);
1733
0
    return xd->tile_ctx->uni_comp_ref_cdf[pred_context][2];
1734
0
}
1735
1736
0
AomCdfProb* svt_aom_get_pred_cdf_comp_ref_p(const MacroBlockD* xd) {
1737
0
    const int pred_context = svt_av1_get_pred_context_comp_ref_p(xd);
1738
0
    return xd->tile_ctx->comp_ref_cdf[pred_context][0];
1739
0
}
1740
1741
0
AomCdfProb* svt_aom_get_pred_cdf_comp_ref_p1(const MacroBlockD* xd) {
1742
0
    const int pred_context = svt_av1_get_pred_context_comp_ref_p1(xd);
1743
0
    return xd->tile_ctx->comp_ref_cdf[pred_context][1];
1744
0
}
1745
1746
0
AomCdfProb* svt_aom_get_pred_cdf_comp_ref_p2(const MacroBlockD* xd) {
1747
0
    const int pred_context = svt_av1_get_pred_context_comp_ref_p2(xd);
1748
0
    return xd->tile_ctx->comp_ref_cdf[pred_context][2];
1749
0
}
1750
1751
0
AomCdfProb* svt_aom_get_pred_cdf_comp_bwdref_p(const MacroBlockD* xd) {
1752
0
    const int pred_context = svt_av1_get_pred_context_comp_bwdref_p(xd);
1753
0
    return xd->tile_ctx->comp_bwdref_cdf[pred_context][0];
1754
0
}
1755
1756
0
AomCdfProb* svt_aom_get_pred_cdf_comp_bwdref_p1(const MacroBlockD* xd) {
1757
0
    const int pred_context = svt_av1_get_pred_context_comp_bwdref_p1(xd);
1758
0
    return xd->tile_ctx->comp_bwdref_cdf[pred_context][1];
1759
0
}
1760
1761
0
int svt_aom_get_comp_reference_type_context_new(const MacroBlockD* xd) {
1762
0
    int                     pred_context;
1763
0
    const MbModeInfo* const above_mbmi     = xd->above_mbmi;
1764
0
    const MbModeInfo* const left_mbmi      = xd->left_mbmi;
1765
0
    const int               above_in_image = xd->up_available;
1766
0
    const int               left_in_image  = xd->left_available;
1767
1768
0
    if (above_in_image && left_in_image) { // both edges available
1769
0
        const int above_intra = !is_inter_block(&above_mbmi->block_mi);
1770
0
        const int left_intra  = !is_inter_block(&left_mbmi->block_mi);
1771
1772
0
        if (above_intra && left_intra) { // intra/intra
1773
0
            pred_context = 2;
1774
0
        } else if (above_intra || left_intra) { // intra/inter
1775
0
            const MbModeInfo* inter_mbmi = above_intra ? left_mbmi : above_mbmi;
1776
1777
0
            if (!has_second_ref(&inter_mbmi->block_mi)) { // single pred
1778
0
                pred_context = 2;
1779
0
            } else { // comp pred
1780
0
                pred_context = 1 + 2 * has_uni_comp_refs(&inter_mbmi->block_mi);
1781
0
            }
1782
0
        } else { // inter/inter
1783
0
            const int              a_sg = !has_second_ref(&above_mbmi->block_mi);
1784
0
            const int              l_sg = !has_second_ref(&left_mbmi->block_mi);
1785
0
            const MvReferenceFrame frfa = above_mbmi->block_mi.ref_frame[0];
1786
0
            const MvReferenceFrame frfl = left_mbmi->block_mi.ref_frame[0];
1787
1788
0
            if (a_sg && l_sg) { // single/single
1789
0
                pred_context = 1 + 2 * (!(IS_BACKWARD_REF_FRAME(frfa) ^ IS_BACKWARD_REF_FRAME(frfl)));
1790
0
            } else if (l_sg || a_sg) { // single/comp
1791
0
                const int uni_rfc = a_sg ? has_uni_comp_refs(&left_mbmi->block_mi)
1792
0
                                         : has_uni_comp_refs(&above_mbmi->block_mi);
1793
1794
0
                if (!uni_rfc) { // comp bidir
1795
0
                    pred_context = 1;
1796
0
                } else { // comp unidir
1797
0
                    pred_context = 3 + (!(IS_BACKWARD_REF_FRAME(frfa) ^ IS_BACKWARD_REF_FRAME(frfl)));
1798
0
                }
1799
0
            } else { // comp/comp
1800
0
                const int a_uni_rfc = has_uni_comp_refs(&above_mbmi->block_mi);
1801
0
                const int l_uni_rfc = has_uni_comp_refs(&left_mbmi->block_mi);
1802
1803
0
                if (!a_uni_rfc && !l_uni_rfc) { // bidir/bidir
1804
0
                    pred_context = 0;
1805
0
                } else if (!a_uni_rfc || !l_uni_rfc) { // unidir/bidir
1806
0
                    pred_context = 2;
1807
0
                } else { // unidir/unidir
1808
0
                    pred_context = 3 + (!((frfa == BWDREF_FRAME) ^ (frfl == BWDREF_FRAME)));
1809
0
                }
1810
0
            }
1811
0
        }
1812
0
    } else if (above_in_image || left_in_image) { // one edge available
1813
0
        const MbModeInfo* edge_mbmi = above_in_image ? above_mbmi : left_mbmi;
1814
1815
0
        if (!is_inter_block(&edge_mbmi->block_mi)) { // intra
1816
0
            pred_context = 2;
1817
0
        } else { // inter
1818
0
            if (!has_second_ref(&edge_mbmi->block_mi)) { // single pred
1819
0
                pred_context = 2;
1820
0
            } else { // comp pred
1821
0
                pred_context = 4 * has_uni_comp_refs(&edge_mbmi->block_mi);
1822
0
            }
1823
0
        }
1824
0
    } else { // no edges available
1825
0
        pred_context = 2;
1826
0
    }
1827
1828
0
    assert(pred_context >= 0 && pred_context < COMP_REF_TYPE_CONTEXTS);
1829
0
    return pred_context;
1830
0
}
1831
1832
// Returns a context number for the given MB prediction signal
1833
//
1834
// Signal the uni-directional compound reference frame pair as either
1835
// (BWDREF, ALTREF), or (LAST, LAST2) / (LAST, LAST3) / (LAST, GOLDEN),
1836
// conditioning on the pair is known as uni-directional.
1837
//
1838
// 3 contexts: Voting is used to compare the count of forward references with
1839
//             that of backward references from the spatial neighbors.
1840
0
int svt_av1_get_pred_context_uni_comp_ref_p(const MacroBlockD* xd) {
1841
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
1842
1843
    // Count of forward references (L, L2, L3, or G)
1844
0
    const int frf_count = ref_counts[LAST_FRAME] + ref_counts[LAST2_FRAME] + ref_counts[LAST3_FRAME] +
1845
0
        ref_counts[GOLDEN_FRAME];
1846
    // Count of backward references (b or A)
1847
0
    const int brf_count = ref_counts[BWDREF_FRAME] + ref_counts[ALTREF2_FRAME] + ref_counts[ALTREF_FRAME];
1848
1849
0
    const int pred_context = (frf_count == brf_count) ? 1 : ((frf_count < brf_count) ? 0 : 2);
1850
1851
0
    assert(pred_context >= 0 && pred_context < UNI_COMP_REF_CONTEXTS);
1852
0
    return pred_context;
1853
0
}
1854
1855
// Returns a context number for the given MB prediction signal
1856
//
1857
// Signal the uni-directional compound reference frame pair as
1858
// either (LAST, LAST2), or (LAST, LAST3) / (LAST, GOLDEN),
1859
// conditioning on the pair is known as one of the above three.
1860
//
1861
// 3 contexts: Voting is used to compare the count of LAST2_FRAME with the
1862
//             total count of LAST3/GOLDEN from the spatial neighbors.
1863
0
int svt_av1_get_pred_context_uni_comp_ref_p1(const MacroBlockD* xd) {
1864
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
1865
1866
    // Count of LAST2
1867
0
    const int last2_count = ref_counts[LAST2_FRAME];
1868
    // Count of LAST3 or GOLDEN
1869
0
    const int last3_or_gld_count = ref_counts[LAST3_FRAME] + ref_counts[GOLDEN_FRAME];
1870
1871
0
    const int pred_context = (last2_count == last3_or_gld_count) ? 1 : ((last2_count < last3_or_gld_count) ? 0 : 2);
1872
1873
0
    assert(pred_context >= 0 && pred_context < UNI_COMP_REF_CONTEXTS);
1874
0
    return pred_context;
1875
0
}
1876
1877
// Returns a context number for the given MB prediction signal
1878
//
1879
// Signal the uni-directional compound reference frame pair as
1880
// either (LAST, LAST3) or (LAST, GOLDEN),
1881
// conditioning on the pair is known as one of the above two.
1882
//
1883
// 3 contexts: Voting is used to compare the count of LAST3_FRAME with the
1884
//             total count of GOLDEN_FRAME from the spatial neighbors.
1885
0
int svt_av1_get_pred_context_uni_comp_ref_p2(const MacroBlockD* xd) {
1886
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
1887
1888
    // Count of LAST3
1889
0
    const int last3_count = ref_counts[LAST3_FRAME];
1890
    // Count of GOLDEN
1891
0
    const int gld_count = ref_counts[GOLDEN_FRAME];
1892
1893
0
    const int pred_context = (last3_count == gld_count) ? 1 : ((last3_count < gld_count) ? 0 : 2);
1894
1895
0
    assert(pred_context >= 0 && pred_context < UNI_COMP_REF_CONTEXTS);
1896
0
    return pred_context;
1897
0
}
1898
1899
0
int svt_aom_get_reference_mode_context_new(const MacroBlockD* xd) {
1900
0
    int                     ctx;
1901
0
    const MbModeInfo* const above_mbmi = xd->above_mbmi;
1902
0
    const MbModeInfo* const left_mbmi  = xd->left_mbmi;
1903
0
    const int               has_above  = xd->up_available;
1904
0
    const int               has_left   = xd->left_available;
1905
1906
    // Note:
1907
    // The mode info data structure has a one element border above and to the
1908
    // left of the entries corresponding to real macroblocks.
1909
    // The prediction flags in these dummy entries are initialized to 0.
1910
0
    if (has_above && has_left) { // both edges available
1911
0
        if (!has_second_ref(&above_mbmi->block_mi) && !has_second_ref(&left_mbmi->block_mi)) {
1912
            // neither edge uses comp pred (0/1)
1913
0
            ctx = IS_BACKWARD_REF_FRAME(above_mbmi->block_mi.ref_frame[0]) ^
1914
0
                IS_BACKWARD_REF_FRAME(left_mbmi->block_mi.ref_frame[0]);
1915
0
        } else if (!has_second_ref(&above_mbmi->block_mi)) {
1916
            // one of two edges uses comp pred (2/3)
1917
0
            ctx = 2 +
1918
0
                (IS_BACKWARD_REF_FRAME(above_mbmi->block_mi.ref_frame[0]) || !is_inter_block(&above_mbmi->block_mi));
1919
0
        } else if (!has_second_ref(&left_mbmi->block_mi)) {
1920
            // one of two edges uses comp pred (2/3)
1921
0
            ctx = 2 +
1922
0
                (IS_BACKWARD_REF_FRAME(left_mbmi->block_mi.ref_frame[0]) || !is_inter_block(&left_mbmi->block_mi));
1923
0
        } else { // both edges use comp pred (4)
1924
0
            ctx = 4;
1925
0
        }
1926
0
    } else if (has_above || has_left) { // one edge available
1927
0
        const MbModeInfo* edge_mbmi = has_above ? above_mbmi : left_mbmi;
1928
1929
0
        if (!has_second_ref(&edge_mbmi->block_mi)) {
1930
            // edge does not use comp pred (0/1)
1931
0
            ctx = IS_BACKWARD_REF_FRAME(edge_mbmi->block_mi.ref_frame[0]);
1932
0
        } else {
1933
            // edge uses comp pred (3)
1934
0
            ctx = 3;
1935
0
        }
1936
0
    } else { // no edges available (1)
1937
0
        ctx = 1;
1938
0
    }
1939
0
    assert(ctx >= 0 && ctx < COMP_INTER_CONTEXTS);
1940
0
    return ctx;
1941
0
}
1942
1943
0
void svt_aom_collect_neighbors_ref_counts_new(MacroBlockD* const xd) {
1944
0
    av1_zero(xd->neighbors_ref_counts);
1945
1946
0
    uint8_t* const ref_counts = xd->neighbors_ref_counts;
1947
1948
0
    const MbModeInfo* const above_mbmi     = xd->above_mbmi;
1949
0
    const MbModeInfo* const left_mbmi      = xd->left_mbmi;
1950
0
    const int               above_in_image = xd->up_available;
1951
0
    const int               left_in_image  = xd->left_available;
1952
1953
    // Above neighbor
1954
0
    if (above_in_image && is_inter_block(&above_mbmi->block_mi)) {
1955
0
        ref_counts[above_mbmi->block_mi.ref_frame[0]]++;
1956
0
        if (has_second_ref(&above_mbmi->block_mi)) {
1957
0
            ref_counts[above_mbmi->block_mi.ref_frame[1]]++;
1958
0
        }
1959
0
    }
1960
1961
    // Left neighbor
1962
0
    if (left_in_image && is_inter_block(&left_mbmi->block_mi)) {
1963
0
        ref_counts[left_mbmi->block_mi.ref_frame[0]]++;
1964
0
        if (has_second_ref(&left_mbmi->block_mi)) {
1965
0
            ref_counts[left_mbmi->block_mi.ref_frame[1]]++;
1966
0
        }
1967
0
    }
1968
0
}
1969
1970
0
#define WRITE_REF_BIT(bname, pname) aom_write_symbol(w, bname, svt_aom_get_pred_cdf_##pname(xd), 2)
1971
1972
/***************************************************************************************/
1973
1974
// == Common context functions for both comp and single ref ==
1975
//
1976
// Obtain contexts to signal a reference frame to be either LAST/LAST2 or
1977
// LAST3/GOLDEN.
1978
0
static int32_t get_pred_context_ll2_or_l3gld(const MacroBlockD* xd) {
1979
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
1980
1981
    // Count of LAST + LAST2
1982
0
    const int32_t last_last2_count = ref_counts[LAST_FRAME] + ref_counts[LAST2_FRAME];
1983
    // Count of LAST3 + GOLDEN
1984
0
    const int32_t last3_gld_count = ref_counts[LAST3_FRAME] + ref_counts[GOLDEN_FRAME];
1985
1986
0
    const int32_t pred_context = (last_last2_count == last3_gld_count) ? 1
1987
0
                                                                       : ((last_last2_count < last3_gld_count) ? 0 : 2);
1988
1989
0
    assert(pred_context >= 0 && pred_context < REF_CONTEXTS);
1990
0
    return pred_context;
1991
0
}
1992
1993
// Obtain contexts to signal a reference frame to be either LAST or LAST2.
1994
0
static int32_t get_pred_context_last_or_last2(const MacroBlockD* xd) {
1995
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
1996
1997
    // Count of LAST
1998
0
    const int32_t last_count = ref_counts[LAST_FRAME];
1999
    // Count of LAST2
2000
0
    const int32_t last2_count = ref_counts[LAST2_FRAME];
2001
2002
0
    const int32_t pred_context = (last_count == last2_count) ? 1 : ((last_count < last2_count) ? 0 : 2);
2003
2004
0
    assert(pred_context >= 0 && pred_context < REF_CONTEXTS);
2005
0
    return pred_context;
2006
0
}
2007
2008
// Obtain contexts to signal a reference frame to be either LAST3 or GOLDEN.
2009
0
static int32_t get_pred_context_last3_or_gld(const MacroBlockD* xd) {
2010
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
2011
2012
    // Count of LAST3
2013
0
    const int32_t last3_count = ref_counts[LAST3_FRAME];
2014
    // Count of GOLDEN
2015
0
    const int32_t gld_count = ref_counts[GOLDEN_FRAME];
2016
2017
0
    const int32_t pred_context = (last3_count == gld_count) ? 1 : ((last3_count < gld_count) ? 0 : 2);
2018
2019
0
    assert(pred_context >= 0 && pred_context < REF_CONTEXTS);
2020
0
    return pred_context;
2021
0
}
2022
2023
// Obtain contexts to signal a reference frame be either BWDREF/ALTREF2, or
2024
// ALTREF.
2025
0
static int32_t get_pred_context_brfarf2_or_arf(const MacroBlockD* xd) {
2026
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
2027
2028
    // Counts of BWDREF, ALTREF2, or ALTREF frames (b, A2, or A)
2029
0
    const int32_t brfarf2_count = ref_counts[BWDREF_FRAME] + ref_counts[ALTREF2_FRAME];
2030
0
    const int32_t arf_count     = ref_counts[ALTREF_FRAME];
2031
2032
0
    const int32_t pred_context = (brfarf2_count == arf_count) ? 1 : ((brfarf2_count < arf_count) ? 0 : 2);
2033
2034
0
    assert(pred_context >= 0 && pred_context < REF_CONTEXTS);
2035
0
    return pred_context;
2036
0
}
2037
2038
// Obtain contexts to signal a reference frame be either BWDREF or ALTREF2.
2039
0
static int32_t get_pred_context_brf_or_arf2(const MacroBlockD* xd) {
2040
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
2041
2042
    // Count of BWDREF frames (b)
2043
0
    const int32_t brf_count = ref_counts[BWDREF_FRAME];
2044
    // Count of ALTREF2 frames (A2)
2045
0
    const int32_t arf2_count = ref_counts[ALTREF2_FRAME];
2046
2047
0
    const int32_t pred_context = (brf_count == arf2_count) ? 1 : ((brf_count < arf2_count) ? 0 : 2);
2048
2049
0
    assert(pred_context >= 0 && pred_context < REF_CONTEXTS);
2050
0
    return pred_context;
2051
0
}
2052
2053
// == Context functions for comp ref ==
2054
//
2055
// Returns a context number for the given MB prediction signal
2056
// Signal the first reference frame for a compound mode be either
2057
// GOLDEN/LAST3, or LAST/LAST2.
2058
0
int32_t svt_av1_get_pred_context_comp_ref_p(const MacroBlockD* xd) {
2059
0
    return get_pred_context_ll2_or_l3gld(xd);
2060
0
}
2061
2062
// Returns a context number for the given MB prediction signal
2063
// Signal the first reference frame for a compound mode be LAST,
2064
// conditioning on that it is known either LAST/LAST2.
2065
0
int32_t svt_av1_get_pred_context_comp_ref_p1(const MacroBlockD* xd) {
2066
0
    return get_pred_context_last_or_last2(xd);
2067
0
}
2068
2069
// Returns a context number for the given MB prediction signal
2070
// Signal the first reference frame for a compound mode be GOLDEN,
2071
// conditioning on that it is known either GOLDEN or LAST3.
2072
0
int32_t svt_av1_get_pred_context_comp_ref_p2(const MacroBlockD* xd) {
2073
0
    return get_pred_context_last3_or_gld(xd);
2074
0
}
2075
2076
// Signal the 2nd reference frame for a compound mode be either
2077
// ALTREF, or ALTREF2/BWDREF.
2078
0
int32_t svt_av1_get_pred_context_comp_bwdref_p(const MacroBlockD* xd) {
2079
0
    return get_pred_context_brfarf2_or_arf(xd);
2080
0
}
2081
2082
// Signal the 2nd reference frame for a compound mode be either
2083
// ALTREF2 or BWDREF.
2084
0
int32_t svt_av1_get_pred_context_comp_bwdref_p1(const MacroBlockD* xd) {
2085
0
    return get_pred_context_brf_or_arf2(xd);
2086
0
}
2087
2088
// == Context functions for single ref ==
2089
//
2090
// For the bit to signal whether the single reference is a forward reference
2091
// frame or a backward reference frame.
2092
0
int32_t svt_av1_get_pred_context_single_ref_p1(const MacroBlockD* xd) {
2093
0
    const uint8_t* const ref_counts = &xd->neighbors_ref_counts[0];
2094
2095
    // Count of forward reference frames
2096
0
    const int32_t fwd_count = ref_counts[LAST_FRAME] + ref_counts[LAST2_FRAME] + ref_counts[LAST3_FRAME] +
2097
0
        ref_counts[GOLDEN_FRAME];
2098
    // Count of backward reference frames
2099
0
    const int32_t bwd_count = ref_counts[BWDREF_FRAME] + ref_counts[ALTREF2_FRAME] + ref_counts[ALTREF_FRAME];
2100
2101
0
    const int32_t pred_context = (fwd_count == bwd_count) ? 1 : ((fwd_count < bwd_count) ? 0 : 2);
2102
2103
0
    assert(pred_context >= 0 && pred_context < REF_CONTEXTS);
2104
0
    return pred_context;
2105
0
}
2106
2107
0
AomCdfProb* svt_aom_get_pred_cdf_single_ref_p1(const MacroBlockD* xd) {
2108
0
    return xd->tile_ctx->single_ref_cdf[svt_av1_get_pred_context_single_ref_p1(xd)][0];
2109
0
}
2110
2111
0
AomCdfProb* svt_aom_get_pred_cdf_single_ref_p2(const MacroBlockD* xd) {
2112
0
    return xd->tile_ctx->single_ref_cdf[svt_av1_get_pred_context_single_ref_p2(xd)][1];
2113
0
}
2114
2115
0
AomCdfProb* svt_aom_get_pred_cdf_single_ref_p3(const MacroBlockD* xd) {
2116
0
    return xd->tile_ctx->single_ref_cdf[svt_av1_get_pred_context_single_ref_p3(xd)][2];
2117
0
}
2118
2119
0
AomCdfProb* svt_aom_get_pred_cdf_single_ref_p4(const MacroBlockD* xd) {
2120
0
    return xd->tile_ctx->single_ref_cdf[svt_av1_get_pred_context_single_ref_p4(xd)][3];
2121
0
}
2122
2123
0
AomCdfProb* svt_aom_get_pred_cdf_single_ref_p5(const MacroBlockD* xd) {
2124
0
    return xd->tile_ctx->single_ref_cdf[svt_av1_get_pred_context_single_ref_p5(xd)][4];
2125
0
}
2126
2127
0
AomCdfProb* svt_aom_get_pred_cdf_single_ref_p6(const MacroBlockD* xd) {
2128
0
    return xd->tile_ctx->single_ref_cdf[svt_av1_get_pred_context_single_ref_p6(xd)][5];
2129
0
}
2130
2131
// For the bit to signal whether the single reference is ALTREF_FRAME or
2132
// non-ALTREF backward reference frame, knowing that it shall be either of
2133
// these 2 choices.
2134
0
int32_t svt_av1_get_pred_context_single_ref_p2(const MacroBlockD* xd) {
2135
0
    return get_pred_context_brfarf2_or_arf(xd);
2136
0
}
2137
2138
// For the bit to signal whether the single reference is LAST3/GOLDEN or
2139
// LAST2/LAST, knowing that it shall be either of these 2 choices.
2140
0
int32_t svt_av1_get_pred_context_single_ref_p3(const MacroBlockD* xd) {
2141
0
    return get_pred_context_ll2_or_l3gld(xd);
2142
0
}
2143
2144
// For the bit to signal whether the single reference is LAST2_FRAME or
2145
// LAST_FRAME, knowing that it shall be either of these 2 choices.
2146
0
int32_t svt_av1_get_pred_context_single_ref_p4(const MacroBlockD* xd) {
2147
0
    return get_pred_context_last_or_last2(xd);
2148
0
}
2149
2150
// For the bit to signal whether the single reference is GOLDEN_FRAME or
2151
// LAST3_FRAME, knowing that it shall be either of these 2 choices.
2152
0
int32_t svt_av1_get_pred_context_single_ref_p5(const MacroBlockD* xd) {
2153
0
    return get_pred_context_last3_or_gld(xd);
2154
0
}
2155
2156
// For the bit to signal whether the single reference is ALTREF2_FRAME or
2157
// BWDREF_FRAME, knowing that it shall be either of these 2 choices.
2158
0
int32_t svt_av1_get_pred_context_single_ref_p6(const MacroBlockD* xd) {
2159
0
    return get_pred_context_brf_or_arf2(xd);
2160
0
}
2161
2162
/***************************************************************************************/
2163
2164
0
static void write_ref_frames(PictureParentControlSet* pcs, const MacroBlockD* xd, AomWriter* w) {
2165
0
    FrameHeader*            frm_hdr     = &pcs->frm_hdr;
2166
0
    const MbModeInfo* const mbmi        = xd->mi[0];
2167
0
    const int               is_compound = has_second_ref(&mbmi->block_mi);
2168
0
    {
2169
        // does the feature use compound prediction or not
2170
        // (if not specified at the frame/segment level)
2171
0
        if (frm_hdr->reference_mode == REFERENCE_MODE_SELECT) {
2172
0
            if (is_comp_ref_allowed(mbmi->bsize)) {
2173
0
                aom_write_symbol(w, is_compound, svt_aom_get_reference_mode_cdf(xd), 2);
2174
0
            }
2175
0
        } else {
2176
0
            assert((!is_compound) == (frm_hdr->reference_mode == SINGLE_REFERENCE));
2177
0
        }
2178
2179
0
        if (is_compound) {
2180
0
            const CompReferenceType comp_ref_type = has_uni_comp_refs(&mbmi->block_mi) ? UNIDIR_COMP_REFERENCE
2181
0
                                                                                       : BIDIR_COMP_REFERENCE;
2182
0
            aom_write_symbol(w, comp_ref_type, svt_aom_get_comp_reference_type_cdf(xd), 2);
2183
2184
0
            if (comp_ref_type == UNIDIR_COMP_REFERENCE) {
2185
0
                const int bit = mbmi->block_mi.ref_frame[0] == BWDREF_FRAME;
2186
0
                WRITE_REF_BIT(bit, uni_comp_ref_p);
2187
2188
0
                if (!bit) {
2189
0
                    assert(mbmi->block_mi.ref_frame[0] == LAST_FRAME);
2190
0
                    const int bit1 = mbmi->block_mi.ref_frame[1] == LAST3_FRAME ||
2191
0
                        mbmi->block_mi.ref_frame[1] == GOLDEN_FRAME;
2192
0
                    WRITE_REF_BIT(bit1, uni_comp_ref_p1);
2193
0
                    if (bit1) {
2194
0
                        const int bit2 = mbmi->block_mi.ref_frame[1] == GOLDEN_FRAME;
2195
0
                        WRITE_REF_BIT(bit2, uni_comp_ref_p2);
2196
0
                    }
2197
0
                } else {
2198
0
                    assert(mbmi->block_mi.ref_frame[1] == ALTREF_FRAME);
2199
0
                }
2200
0
                return;
2201
0
            }
2202
2203
0
            assert(comp_ref_type == BIDIR_COMP_REFERENCE);
2204
2205
0
            const int bit = (mbmi->block_mi.ref_frame[0] == GOLDEN_FRAME || mbmi->block_mi.ref_frame[0] == LAST3_FRAME);
2206
0
            WRITE_REF_BIT(bit, comp_ref_p);
2207
2208
0
            if (!bit) {
2209
0
                const int bit1 = mbmi->block_mi.ref_frame[0] == LAST2_FRAME;
2210
0
                WRITE_REF_BIT(bit1, comp_ref_p1);
2211
0
            } else {
2212
0
                const int bit2 = mbmi->block_mi.ref_frame[0] == GOLDEN_FRAME;
2213
0
                WRITE_REF_BIT(bit2, comp_ref_p2);
2214
0
            }
2215
2216
0
            const int bit_bwd = mbmi->block_mi.ref_frame[1] == ALTREF_FRAME;
2217
0
            WRITE_REF_BIT(bit_bwd, comp_bwdref_p);
2218
2219
0
            if (!bit_bwd) {
2220
0
                WRITE_REF_BIT(mbmi->block_mi.ref_frame[1] == ALTREF2_FRAME, comp_bwdref_p1);
2221
0
            }
2222
0
        } else {
2223
0
            const int bit0 = (mbmi->block_mi.ref_frame[0] <= ALTREF_FRAME &&
2224
0
                              mbmi->block_mi.ref_frame[0] >= BWDREF_FRAME);
2225
0
            WRITE_REF_BIT(bit0, single_ref_p1);
2226
2227
0
            if (bit0) {
2228
0
                const int bit1 = mbmi->block_mi.ref_frame[0] == ALTREF_FRAME;
2229
0
                WRITE_REF_BIT(bit1, single_ref_p2);
2230
0
                if (!bit1) {
2231
0
                    WRITE_REF_BIT(mbmi->block_mi.ref_frame[0] == ALTREF2_FRAME, single_ref_p6);
2232
0
                }
2233
0
            } else {
2234
0
                const int bit2 = (mbmi->block_mi.ref_frame[0] == LAST3_FRAME ||
2235
0
                                  mbmi->block_mi.ref_frame[0] == GOLDEN_FRAME);
2236
0
                WRITE_REF_BIT(bit2, single_ref_p3);
2237
0
                if (!bit2) {
2238
0
                    const int bit3 = mbmi->block_mi.ref_frame[0] != LAST_FRAME;
2239
0
                    WRITE_REF_BIT(bit3, single_ref_p4);
2240
0
                } else {
2241
0
                    const int bit4 = mbmi->block_mi.ref_frame[0] != LAST3_FRAME;
2242
0
                    WRITE_REF_BIT(bit4, single_ref_p5);
2243
0
                }
2244
0
            }
2245
0
        }
2246
0
    }
2247
0
}
2248
2249
0
static void encode_restoration_mode(PictureParentControlSet* pcs, AomWriteBitBuffer* wb) {
2250
0
    FrameHeader* frm_hdr = &pcs->frm_hdr;
2251
    //SVT_ERROR("encode_restoration_mode might not work. Double check the reference code\n");
2252
0
    assert(!frm_hdr->all_lossless);
2253
    // move out side of the function
2254
    //if (!cm->seq_params.enable_restoration) return;
2255
2256
0
    if (frm_hdr->allow_intrabc) {
2257
0
        return;
2258
0
    }
2259
2260
0
    const int32_t num_planes = 3; // av1_num_planes(cm);
2261
0
    int32_t       all_none = 1, chroma_none = 1;
2262
0
    for (int32_t p = 0; p < num_planes; ++p) {
2263
0
        RestorationInfo* rsi = &pcs->child_pcs->rst_info[p];
2264
2265
0
        if (rsi->frame_restoration_type != RESTORE_NONE) {
2266
0
            all_none = 0;
2267
0
            chroma_none &= (int32_t)(p == 0);
2268
0
        }
2269
0
        switch (rsi->frame_restoration_type) {
2270
0
        case RESTORE_NONE:
2271
0
            svt_aom_wb_write_bit(wb, 0);
2272
0
            svt_aom_wb_write_bit(wb, 0);
2273
0
            break;
2274
0
        case RESTORE_WIENER:
2275
0
            svt_aom_wb_write_bit(wb, 1);
2276
0
            svt_aom_wb_write_bit(wb, 0);
2277
0
            break;
2278
0
        case RESTORE_SGRPROJ:
2279
0
            svt_aom_wb_write_bit(wb, 1);
2280
0
            svt_aom_wb_write_bit(wb, 1);
2281
0
            break;
2282
0
        case RESTORE_SWITCHABLE:
2283
0
            svt_aom_wb_write_bit(wb, 0);
2284
0
            svt_aom_wb_write_bit(wb, 1);
2285
0
            break;
2286
0
        default:
2287
0
            assert(0);
2288
0
        }
2289
0
    }
2290
0
    if (!all_none) {
2291
0
        const int32_t    sb_size = pcs->scs->seq_header.sb_size == BLOCK_128X128 ? 128 : 64;
2292
0
        RestorationInfo* rsi     = &pcs->child_pcs->rst_info[0];
2293
0
        assert(rsi->restoration_unit_size >= sb_size);
2294
0
        assert(RESTORATION_UNITSIZE_MAX == 256);
2295
2296
0
        if (sb_size == 64) {
2297
0
            svt_aom_wb_write_bit(wb, rsi->restoration_unit_size > 64);
2298
0
        }
2299
0
        if (rsi->restoration_unit_size > 64) {
2300
0
            svt_aom_wb_write_bit(wb, rsi->restoration_unit_size > 128);
2301
0
        }
2302
0
    }
2303
0
    if (!chroma_none) {
2304
0
        svt_aom_wb_write_bit(
2305
0
            wb, pcs->child_pcs->rst_info[1].restoration_unit_size != pcs->child_pcs->rst_info[0].restoration_unit_size);
2306
0
        assert(pcs->child_pcs->rst_info[1].restoration_unit_size == pcs->child_pcs->rst_info[0].restoration_unit_size ||
2307
0
               pcs->child_pcs->rst_info[1].restoration_unit_size ==
2308
0
                   (pcs->child_pcs->rst_info[0].restoration_unit_size >> 1));
2309
0
        assert(pcs->child_pcs->rst_info[2].restoration_unit_size == pcs->child_pcs->rst_info[1].restoration_unit_size);
2310
0
    }
2311
0
}
2312
2313
860
static void encode_segmentation(PictureParentControlSet* pcs, AomWriteBitBuffer* wb) {
2314
860
    SegmentationParams* segmentation_params = &pcs->frm_hdr.segmentation_params;
2315
860
    svt_aom_wb_write_bit(wb, segmentation_params->segmentation_enabled);
2316
860
    if (segmentation_params->segmentation_enabled) {
2317
0
        if (!(pcs->frm_hdr.primary_ref_frame == PRIMARY_REF_NONE)) {
2318
0
            svt_aom_wb_write_bit(wb, segmentation_params->segmentation_update_map);
2319
0
            if (segmentation_params->segmentation_update_map) {
2320
0
                svt_aom_wb_write_bit(wb, segmentation_params->segmentation_temporal_update);
2321
0
            }
2322
0
            svt_aom_wb_write_bit(wb, segmentation_params->segmentation_update_data);
2323
0
        }
2324
0
        if (segmentation_params->segmentation_update_data) {
2325
0
            for (int i = 0; i < MAX_SEGMENTS; i++) {
2326
0
                for (int j = 0; j < SEG_LVL_MAX; j++) {
2327
0
                    svt_aom_wb_write_bit(wb, segmentation_params->feature_enabled[i][j]);
2328
0
                    if (segmentation_params->feature_enabled[i][j]) {
2329
                        //TODO: add clamping
2330
0
                        if (svt_aom_segmentation_feature_signed[j]) {
2331
0
                            svt_aom_wb_write_inv_signed_literal(
2332
0
                                wb, segmentation_params->feature_data[i][j], svt_aom_segmentation_feature_bits[j]);
2333
0
                        } else {
2334
0
                            svt_aom_wb_write_literal(
2335
0
                                wb, segmentation_params->feature_data[i][j], svt_aom_segmentation_feature_bits[j]);
2336
0
                        }
2337
0
                    }
2338
0
                }
2339
0
            }
2340
0
        }
2341
0
    }
2342
860
}
2343
2344
490
static void encode_loopfilter(PictureParentControlSet* pcs, AomWriteBitBuffer* wb) {
2345
490
    FrameHeader* frm_hdr = &pcs->frm_hdr;
2346
490
    assert(!frm_hdr->coded_lossless);
2347
490
    if (frm_hdr->allow_intrabc) {
2348
0
        return;
2349
0
    }
2350
2351
490
    LoopFilter* lf = &frm_hdr->loop_filter_params;
2352
2353
    // Encode the loop filter level and type
2354
490
    svt_aom_wb_write_literal(wb, lf->filter_level[0], 6);
2355
490
    svt_aom_wb_write_literal(wb, lf->filter_level[1], 6);
2356
490
    if (lf->filter_level[0] || lf->filter_level[1]) {
2357
462
        svt_aom_wb_write_literal(wb, lf->filter_level_u, 6);
2358
462
        svt_aom_wb_write_literal(wb, lf->filter_level_v, 6);
2359
462
    }
2360
490
    svt_aom_wb_write_literal(wb, lf->sharpness_level, 3);
2361
2362
    // Write out loop filter deltas applied at the MB level based on mode or
2363
    // ref frame (if they are enabled).
2364
490
    svt_aom_wb_write_bit(wb, lf->mode_ref_delta_enabled);
2365
490
    if (lf->mode_ref_delta_enabled) {
2366
0
        SVT_ERROR("Loop Filter is not supported yet \n");
2367
        /* svt_aom_wb_write_bit(wb, lf->mode_ref_delta_update);
2368
        if (lf->mode_ref_delta_update) {
2369
        const int32_t prime_idx = pcs->primary_ref_frame;
2370
        const int32_t buf_idx =
2371
        prime_idx == PRIMARY_REF_NONE ? -1 : cm->frame_refs[prime_idx].idx;
2372
        int8_t last_ref_deltas[TOTAL_REFS_PER_FRAME];
2373
        if (prime_idx == PRIMARY_REF_NONE || buf_idx < 0) {
2374
        av1_set_default_ref_deltas(last_ref_deltas);
2375
        } else {
2376
        svt_memcpy(last_ref_deltas, cm->buffer_pool->frame_bufs[buf_idx].ref_deltas,
2377
        TOTAL_REFS_PER_FRAME);
2378
        }
2379
        for (i = 0; i < TOTAL_REFS_PER_FRAME; i++) {
2380
        const int32_t delta = lf->ref_deltas[i];
2381
        const int32_t changed = delta != last_ref_deltas[i];
2382
        svt_aom_wb_write_bit(wb, changed);
2383
        if (changed) svt_aom_wb_write_inv_signed_literal(wb, delta, 6);
2384
        }
2385
        int8_t last_mode_deltas[MAX_MODE_LF_DELTAS];
2386
        if (prime_idx == PRIMARY_REF_NONE || buf_idx < 0) {
2387
        av1_set_default_mode_deltas(last_mode_deltas);
2388
        } else {
2389
        svt_memcpy(last_mode_deltas,
2390
        cm->buffer_pool->frame_bufs[buf_idx].mode_deltas,
2391
        MAX_MODE_LF_DELTAS);
2392
        }
2393
2394
        for (i = 0; i < MAX_MODE_LF_DELTAS; i++) {
2395
        const int32_t delta = lf->mode_deltas[i];
2396
        const int32_t changed = delta != last_mode_deltas[i];
2397
        svt_aom_wb_write_bit(wb, changed);
2398
        if (changed) svt_aom_wb_write_inv_signed_literal(wb, delta, 6);
2399
        }
2400
        }*/
2401
0
    }
2402
490
}
2403
2404
490
static void encode_cdef(const PictureParentControlSet* pcs, AomWriteBitBuffer* wb) {
2405
    //assert(!cm->coded_lossless);
2406
    // moved out side
2407
    //if (!cm->seq_params.cdef_level) return;
2408
2409
490
    const FrameHeader* frm_hdr = &pcs->frm_hdr;
2410
2411
490
    if (frm_hdr->allow_intrabc) {
2412
0
        return;
2413
0
    }
2414
2415
490
    svt_aom_wb_write_literal(wb, frm_hdr->cdef_params.cdef_damping - 3, 2);
2416
    //cdef_pri_damping & cdef_sec_damping consolidated to cdef_damping
2417
    //assert(pcs->cdef_pri_damping == pcs->cdef_sec_damping);
2418
490
    svt_aom_wb_write_literal(wb, frm_hdr->cdef_params.cdef_bits, 2);
2419
980
    for (int32_t i = 0; i < pcs->nb_cdef_strengths; i++) {
2420
490
        svt_aom_wb_write_literal(wb, frm_hdr->cdef_params.cdef_y_strength[i], CDEF_STRENGTH_BITS);
2421
490
        svt_aom_wb_write_literal(wb, frm_hdr->cdef_params.cdef_uv_strength[i], CDEF_STRENGTH_BITS);
2422
490
    }
2423
490
}
2424
2425
2.58k
static void write_delta_q(AomWriteBitBuffer* wb, int32_t delta_q) {
2426
2.58k
    if (delta_q != 0) {
2427
0
        svt_aom_wb_write_bit(wb, 1);
2428
0
        svt_aom_wb_write_inv_signed_literal(wb, delta_q, 6);
2429
2.58k
    } else {
2430
2.58k
        svt_aom_wb_write_bit(wb, 0);
2431
2.58k
    }
2432
2.58k
}
2433
2434
860
static void encode_quantization(const PictureParentControlSet* const pcs, AomWriteBitBuffer* wb) {
2435
860
    const FrameHeader* frm_hdr = &pcs->frm_hdr;
2436
860
    svt_aom_wb_write_literal(wb, frm_hdr->quantization_params.base_q_idx, QINDEX_BITS);
2437
860
    write_delta_q(wb, frm_hdr->quantization_params.delta_q_dc[PLANE_Y]);
2438
860
    int32_t diff_uv_delta = (frm_hdr->quantization_params.delta_q_dc[PLANE_U] !=
2439
860
                             frm_hdr->quantization_params.delta_q_dc[PLANE_V]) ||
2440
860
        (frm_hdr->quantization_params.delta_q_ac[PLANE_U] != frm_hdr->quantization_params.delta_q_ac[PLANE_V]);
2441
2442
860
    if (diff_uv_delta) {
2443
0
        svt_aom_wb_write_bit(wb, diff_uv_delta);
2444
0
    }
2445
860
    write_delta_q(wb, frm_hdr->quantization_params.delta_q_dc[PLANE_U]);
2446
860
    write_delta_q(wb, frm_hdr->quantization_params.delta_q_ac[PLANE_U]);
2447
860
    if (diff_uv_delta) {
2448
0
        write_delta_q(wb, frm_hdr->quantization_params.delta_q_dc[PLANE_V]);
2449
0
        write_delta_q(wb, frm_hdr->quantization_params.delta_q_ac[PLANE_V]);
2450
0
    }
2451
860
    svt_aom_wb_write_bit(wb, frm_hdr->quantization_params.using_qmatrix);
2452
860
    if (frm_hdr->quantization_params.using_qmatrix) {
2453
0
        svt_aom_wb_write_literal(wb, frm_hdr->quantization_params.qm[PLANE_Y], QM_LEVEL_BITS);
2454
0
        svt_aom_wb_write_literal(wb, frm_hdr->quantization_params.qm[PLANE_U], QM_LEVEL_BITS);
2455
0
        if (!diff_uv_delta) {
2456
0
            assert(frm_hdr->quantization_params.qm[PLANE_U] == frm_hdr->quantization_params.qm[PLANE_V]);
2457
0
        } else {
2458
0
            svt_aom_wb_write_literal(wb, frm_hdr->quantization_params.qm[PLANE_V], QM_LEVEL_BITS);
2459
0
        }
2460
0
    }
2461
860
}
2462
2463
860
static void write_tile_info_max_tile(const PictureParentControlSet* const pcs, AomWriteBitBuffer* wb) {
2464
860
    Av1Common* cm = pcs->av1_cm;
2465
860
    svt_aom_wb_write_bit(wb, cm->tiles_info.uniform_tile_spacing_flag);
2466
2467
860
    if (cm->tiles_info.uniform_tile_spacing_flag) {
2468
        // Uniform spaced tiles with power-of-two number of rows and columns
2469
        // tile columns
2470
860
        int32_t ones = cm->log2_tile_cols - cm->tiles_info.min_log2_tile_cols;
2471
2.39k
        while (ones--) {
2472
1.53k
            svt_aom_wb_write_bit(wb, 1);
2473
1.53k
        }
2474
860
        if (cm->log2_tile_cols < cm->tiles_info.max_log2_tile_cols) {
2475
224
            svt_aom_wb_write_bit(wb, 0);
2476
224
        }
2477
        // rows
2478
860
        cm->tiles_info.min_log2_tile_rows = AOMMAX(cm->tiles_info.min_log2_tiles - cm->log2_tile_cols, 0);
2479
860
        ones                              = cm->log2_tile_rows - cm->tiles_info.min_log2_tile_rows;
2480
2.33k
        while (ones--) {
2481
1.47k
            svt_aom_wb_write_bit(wb, 1);
2482
1.47k
        }
2483
860
        if (cm->log2_tile_rows < cm->tiles_info.max_log2_tile_rows) {
2484
102
            svt_aom_wb_write_bit(wb, 0);
2485
102
        }
2486
860
    } else {
2487
        // Explicit tiles with configurable tile widths and heights
2488
0
        SVT_ERROR("NON uniform_tile_spacing_flag not supported yet\n");
2489
        //// columns
2490
        // int sb_size_log2 = pcs->scs->seq_header.sb_size_log2;
2491
        //for (i = 0; i < cm->tile_cols; i++) {
2492
        //    size_sb = (cm->tile_col_start_mi[i + 1] - cm->tile_col_start_mi[i]) >> sb_size_log2;
2493
        //    wb_write_uniform(wb, AOMMIN(width_sb, cm->max_tile_width_sb),
2494
        //        size_sb - 1);
2495
        //    width_sb -= size_sb;
2496
        //}
2497
        //assert(width_sb == 0);
2498
2499
        //// rows
2500
        //for (i = 0; i < cm->tile_rows; i++) {
2501
        //    size_sb = (cm->tile_row_start_mi[i + 1] - cm->tile_row_start_mi[i]) >> sb_size_log2;
2502
        //    wb_write_uniform(wb, AOMMIN(height_sb, cm->max_tile_height_sb),
2503
        //        size_sb - 1);
2504
        //    height_sb -= size_sb;
2505
        //}
2506
        //assert(height_sb == 0);
2507
0
    }
2508
860
}
2509
2510
3.01k
void svt_av1_get_tile_limits(PictureParentControlSet* pcs) {
2511
3.01k
    Av1Common* cm = pcs->av1_cm;
2512
2513
3.01k
    int32_t mi_cols                  = ALIGN_POWER_OF_TWO(cm->mi_cols, pcs->log2_sb_size);
2514
3.01k
    int32_t mi_rows                  = ALIGN_POWER_OF_TWO(cm->mi_rows, pcs->log2_sb_size);
2515
3.01k
    int32_t sb_cols                  = mi_cols >> pcs->log2_sb_size;
2516
3.01k
    int32_t sb_rows                  = mi_rows >> pcs->log2_sb_size;
2517
3.01k
    int32_t sb_size_log2             = pcs->log2_sb_size + MI_SIZE_LOG2;
2518
3.01k
    cm->tiles_info.max_tile_width_sb = MAX_TILE_WIDTH >> sb_size_log2;
2519
3.01k
    int32_t max_tile_area_sb         = MAX_TILE_AREA >> (2 * sb_size_log2);
2520
2521
3.01k
    cm->tiles_info.min_log2_tile_cols = tile_log2(cm->tiles_info.max_tile_width_sb, sb_cols);
2522
3.01k
    cm->tiles_info.max_log2_tile_cols = tile_log2(1, AOMMIN(sb_cols, MAX_TILE_COLS));
2523
3.01k
    cm->tiles_info.max_log2_tile_rows = tile_log2(1, AOMMIN(sb_rows, MAX_TILE_ROWS));
2524
3.01k
    cm->tiles_info.min_log2_tile_rows = 0; // CHKN Tiles
2525
3.01k
    cm->tiles_info.min_log2_tiles     = tile_log2(max_tile_area_sb, sb_cols * sb_rows);
2526
3.01k
    cm->tiles_info.min_log2_tiles     = AOMMAX(cm->tiles_info.min_log2_tiles, cm->tiles_info.min_log2_tile_cols);
2527
3.01k
}
2528
2529
2.15k
void svt_av1_calculate_tile_cols(PictureParentControlSet* pcs) {
2530
2.15k
    Av1Common* const cm = pcs->av1_cm;
2531
2532
2.15k
    const int mi_cols      = ALIGN_POWER_OF_TWO(cm->mi_cols, pcs->log2_sb_size);
2533
2.15k
    const int mi_rows      = ALIGN_POWER_OF_TWO(cm->mi_rows, pcs->log2_sb_size);
2534
2.15k
    const int sb_cols      = mi_cols >> pcs->log2_sb_size;
2535
2.15k
    const int sb_rows      = mi_rows >> pcs->log2_sb_size;
2536
2.15k
    const int sb_size_log2 = pcs->log2_sb_size;
2537
2538
2.15k
    if (cm->tiles_info.uniform_tile_spacing_flag) {
2539
2.15k
        int size_sb = ALIGN_POWER_OF_TWO(sb_cols, cm->log2_tile_cols);
2540
2.15k
        size_sb >>= cm->log2_tile_cols;
2541
2.15k
        assert(size_sb > 0);
2542
2.15k
        int i = 0;
2543
9.13k
        for (int start_sb = 0; start_sb < sb_cols; i++) {
2544
6.98k
            cm->tiles_info.tile_col_start_mi[i] = start_sb << sb_size_log2;
2545
6.98k
            start_sb += size_sb;
2546
6.98k
        }
2547
2.15k
        cm->tiles_info.tile_cols            = i;
2548
2.15k
        cm->tiles_info.tile_col_start_mi[i] = sb_cols << sb_size_log2;
2549
2.15k
        cm->tiles_info.min_log2_tile_rows   = AOMMAX(cm->tiles_info.min_log2_tiles - cm->log2_tile_cols, 0);
2550
2.15k
        cm->tiles_info.max_tile_height_sb   = sb_rows >> cm->tiles_info.min_log2_tile_rows;
2551
2552
2.15k
        cm->tile_width = size_sb << pcs->log2_sb_size;
2553
2.15k
        cm->tile_width = AOMMIN(cm->tile_width, cm->mi_cols);
2554
2.15k
    } else {
2555
0
        int max_tile_area_sb = (sb_rows * sb_cols);
2556
0
        int widest_tile_sb   = 1;
2557
0
        cm->log2_tile_cols   = tile_log2(1, cm->tiles_info.tile_cols);
2558
0
        for (int i = 0; i < cm->tiles_info.tile_cols; i++) {
2559
0
            int size_sb = (cm->tiles_info.tile_col_start_mi[i + 1] - cm->tiles_info.tile_col_start_mi[i]) >>
2560
0
                sb_size_log2;
2561
0
            widest_tile_sb = AOMMAX(widest_tile_sb, size_sb);
2562
0
        }
2563
0
        if (cm->tiles_info.min_log2_tiles) {
2564
0
            max_tile_area_sb >>= (cm->tiles_info.min_log2_tiles + 1);
2565
0
        }
2566
2567
0
        cm->tiles_info.max_tile_height_sb = AOMMAX(max_tile_area_sb / widest_tile_sb, 1);
2568
0
    }
2569
2.15k
}
2570
2571
2.15k
void svt_av1_calculate_tile_rows(PictureParentControlSet* pcs) {
2572
2.15k
    Av1Common* const cm = pcs->av1_cm;
2573
2574
2.15k
    int mi_rows      = ALIGN_POWER_OF_TWO(cm->mi_rows, pcs->log2_sb_size);
2575
2.15k
    int sb_rows      = mi_rows >> pcs->log2_sb_size;
2576
2.15k
    int sb_size_log2 = pcs->log2_sb_size;
2577
2578
2.15k
    if (cm->tiles_info.uniform_tile_spacing_flag) {
2579
2.15k
        int size_sb = ALIGN_POWER_OF_TWO(sb_rows, cm->log2_tile_rows);
2580
2.15k
        size_sb >>= cm->log2_tile_rows;
2581
2.15k
        assert(size_sb > 0);
2582
2.15k
        int i = 0;
2583
8.91k
        for (int start_sb = 0; start_sb < sb_rows; i++) {
2584
6.76k
            cm->tiles_info.tile_row_start_mi[i] = start_sb << sb_size_log2;
2585
6.76k
            start_sb += size_sb;
2586
6.76k
        }
2587
2.15k
        cm->tiles_info.tile_rows            = i;
2588
2.15k
        cm->tiles_info.tile_row_start_mi[i] = sb_rows << sb_size_log2;
2589
2590
2.15k
        cm->tile_height = size_sb << pcs->log2_sb_size;
2591
2.15k
        cm->tile_height = AOMMIN(cm->tile_height, cm->mi_rows);
2592
2.15k
    } else {
2593
0
        cm->log2_tile_rows = tile_log2(1, cm->tiles_info.tile_rows);
2594
0
    }
2595
2.15k
}
2596
2597
2.15k
void svt_aom_set_tile_info(PictureParentControlSet* pcs) {
2598
    /*  Tiling algorithm:
2599
        input : log2_tile_count ==> tile_count = 1<<log2_tile_count
2600
2601
        step1) compute pic_size_in_sb
2602
        step2) then round up to the closed n.tile_count.
2603
        step3) tile_size = rounded_pic_size_in_sb / tile_count.
2604
        step4) we fill tiles of size tile_size until we reach the end of the pic
2605
2606
        Note that: the last tile could have smaller size, and the final number
2607
        of tiles could be less than tile_count
2608
     */
2609
2610
2.15k
    Av1Common* cm = pcs->av1_cm;
2611
    //to connect later if non uniform tile spacing is needed.
2612
2613
2.15k
    svt_av1_get_tile_limits(pcs);
2614
2615
    // configure tile columns
2616
2.15k
    cm->tiles_info.uniform_tile_spacing_flag = 1;
2617
2.15k
    cm->log2_tile_cols                       = AOMMAX(pcs->log2_tile_cols, cm->tiles_info.min_log2_tile_cols);
2618
2.15k
    cm->log2_tile_cols                       = AOMMIN(cm->log2_tile_cols, cm->tiles_info.max_log2_tile_cols);
2619
2620
2.15k
    svt_av1_calculate_tile_cols(pcs);
2621
2622
    // configure tile rows
2623
2.15k
    if (cm->tiles_info.uniform_tile_spacing_flag) {
2624
2.15k
        cm->log2_tile_rows = AOMMAX(pcs->log2_tile_rows, cm->tiles_info.min_log2_tile_rows);
2625
2.15k
        cm->log2_tile_rows = AOMMIN(cm->log2_tile_rows, cm->tiles_info.max_log2_tile_rows);
2626
2.15k
    } else {
2627
0
        int       i            = 0;
2628
0
        const int mi_rows      = ALIGN_POWER_OF_TWO(cm->mi_rows, pcs->log2_sb_size);
2629
0
        const int sb_rows      = mi_rows >> pcs->log2_sb_size;
2630
0
        const int sb_size_log2 = pcs->scs->seq_header.sb_size_log2;
2631
0
        for (int start_sb = 0; start_sb < sb_rows && i < MAX_TILE_ROWS; i++) {
2632
0
            cm->tiles_info.tile_row_start_mi[i] = start_sb << sb_size_log2;
2633
0
            start_sb += cm->tiles_info.max_tile_height_sb;
2634
0
        }
2635
0
        cm->tiles_info.tile_rows            = i;
2636
0
        cm->tiles_info.tile_row_start_mi[i] = sb_rows << sb_size_log2;
2637
0
    }
2638
2.15k
    svt_av1_calculate_tile_rows(pcs);
2639
2.15k
}
2640
2641
860
static void write_tile_info(const PictureParentControlSet* const pcs, AomWriteBitBuffer* wb) {
2642
860
    Av1Common* const cm                     = pcs->av1_cm;
2643
860
    uint16_t         tile_cnt               = cm->tiles_info.tile_rows * cm->tiles_info.tile_cols;
2644
860
    pcs->child_pcs->tile_size_bytes_minus_1 = 0;
2645
860
    svt_av1_get_tile_limits((PictureParentControlSet*)pcs);
2646
860
    write_tile_info_max_tile(pcs, wb);
2647
2648
860
    if (pcs->av1_cm->tiles_info.tile_rows * pcs->av1_cm->tiles_info.tile_cols > 1) {
2649
        // tile id used for cdf update
2650
        // Force each frame to update their data so future frames can use it,
2651
        // even if the current frame did not use it.  This enables REF frames to
2652
        // have the feature off, while NREF frames can have it on.  Used for multi-threading.
2653
850
        svt_aom_wb_write_literal(wb,
2654
850
                                 pcs->av1_cm->tiles_info.tile_rows * pcs->av1_cm->tiles_info.tile_cols - 1,
2655
850
                                 pcs->av1_cm->log2_tile_cols + pcs->av1_cm->log2_tile_rows);
2656
2657
        // Number of bytes in tile size - 1
2658
850
        uint32_t max_tile_size = 0;
2659
9.05k
        for (int tile_idx = 0; tile_idx < tile_cnt - 1; tile_idx++) {
2660
8.20k
            max_tile_size = AOMMAX(max_tile_size, pcs->child_pcs->ec_info[tile_idx]->ec->ec_writer.pos);
2661
8.20k
        }
2662
850
        if (max_tile_size >> 24 != 0) {
2663
0
            pcs->child_pcs->tile_size_bytes_minus_1 = 3;
2664
850
        } else if (max_tile_size >> 16 != 0) {
2665
0
            pcs->child_pcs->tile_size_bytes_minus_1 = 2;
2666
850
        } else if (max_tile_size >> 8 != 0) {
2667
0
            pcs->child_pcs->tile_size_bytes_minus_1 = 1;
2668
850
        } else {
2669
850
            pcs->child_pcs->tile_size_bytes_minus_1 = 0;
2670
850
        }
2671
2672
850
        svt_aom_wb_write_literal(wb, pcs->child_pcs->tile_size_bytes_minus_1, 2); //Jing: Change 3 to smaller size
2673
850
    }
2674
860
}
2675
2676
860
static AOM_INLINE void write_render_size(AomWriteBitBuffer* wb, PictureParentControlSet* ppcs) {
2677
860
    int render_and_frame_size_different = 0;
2678
860
    if (ppcs->frame_resize_enabled) {
2679
0
        render_and_frame_size_different = 1;
2680
0
    }
2681
860
    svt_aom_wb_write_bit(wb, render_and_frame_size_different);
2682
860
    if (!render_and_frame_size_different) {
2683
860
        return;
2684
860
    }
2685
0
    uint32_t render_width_minus_1  = ppcs->render_width - 1;
2686
0
    uint32_t render_height_minus_1 = ppcs->render_height - 1;
2687
0
    svt_aom_wb_write_literal(wb, render_width_minus_1, 16);
2688
0
    svt_aom_wb_write_literal(wb, render_height_minus_1, 16);
2689
0
}
2690
2691
860
static AOM_INLINE void write_superres_scale(AomWriteBitBuffer* wb, PictureParentControlSet* pcs) {
2692
860
    SequenceControlSet* scs            = pcs->scs;
2693
860
    Av1Common*          cm             = pcs->av1_cm;
2694
860
    uint8_t             superres_denom = cm->frm_size.superres_denominator;
2695
2696
860
    if (!scs->seq_header.enable_superres) {
2697
860
        assert(cm->frm_size.superres_denominator == SCALE_NUMERATOR);
2698
860
        return;
2699
860
    }
2700
2701
    // First bit is whether to to scale or not
2702
0
    if (superres_denom == SCALE_NUMERATOR) {
2703
0
        svt_aom_wb_write_bit(wb, 0); // no scaling
2704
0
    } else {
2705
0
        svt_aom_wb_write_bit(wb, 1); // scaling, write scale factor
2706
0
        assert(superres_denom >= SUPERRES_SCALE_DENOMINATOR_MIN);
2707
0
        assert(superres_denom < SUPERRES_SCALE_DENOMINATOR_MIN + (1 << SUPERRES_SCALE_BITS));
2708
0
        svt_aom_wb_write_literal(wb, superres_denom - SUPERRES_SCALE_DENOMINATOR_MIN, SUPERRES_SCALE_BITS);
2709
0
    }
2710
0
}
2711
2712
860
static void write_frame_size(PictureParentControlSet* pcs, int32_t frame_size_override, AomWriteBitBuffer* wb) {
2713
860
    SequenceControlSet* scs = pcs->scs;
2714
860
    (void)(*pcs);
2715
860
    (void)frame_size_override;
2716
860
    Av1Common*    cm           = pcs->av1_cm;
2717
860
    const int32_t coded_width  = cm->frm_size.superres_upscaled_width - 1;
2718
860
    const int32_t coded_height = cm->frm_size.superres_upscaled_height - 1;
2719
2720
860
    if (frame_size_override) {
2721
0
        int32_t num_bits_width  = scs->seq_header.frame_width_bits;
2722
0
        int32_t num_bits_height = scs->seq_header.frame_height_bits;
2723
0
        svt_aom_wb_write_literal(wb, coded_width, num_bits_width);
2724
0
        svt_aom_wb_write_literal(wb, coded_height, num_bits_height);
2725
0
    }
2726
2727
860
    write_superres_scale(wb, pcs);
2728
860
    write_render_size(wb, pcs);
2729
860
}
2730
2731
860
static void write_profile(BitstreamProfile profile, AomWriteBitBuffer* wb) {
2732
860
    assert(profile >= PROFILE_0 && profile < MAX_PROFILES);
2733
860
    svt_aom_wb_write_literal(wb, profile, PROFILE_BITS);
2734
860
}
2735
2736
860
static AOM_INLINE void write_bitdepth(const SequenceControlSet* const scs, AomWriteBitBuffer* wb) {
2737
    // Profile 0/1: [0] for 8 bit, [1]  10-bit
2738
    // Profile   2: [0] for 8 bit, [10] 10-bit, [11] - 12-bit
2739
860
    svt_aom_wb_write_bit(wb, scs->static_config.encoder_bit_depth == EB_EIGHT_BIT ? 0 : 1);
2740
860
    if (scs->static_config.profile == PROFESSIONAL_PROFILE && scs->static_config.encoder_bit_depth != EB_EIGHT_BIT) {
2741
0
        SVT_ERROR("Profile 2 Not supported\n");
2742
0
        svt_aom_wb_write_bit(wb, scs->static_config.encoder_bit_depth == EB_TEN_BIT ? 0 : 1);
2743
0
    }
2744
860
}
2745
2746
860
static AOM_INLINE void write_color_config(const SequenceControlSet* const scs, AomWriteBitBuffer* wb) {
2747
860
    write_bitdepth(scs, wb);
2748
860
    const int is_monochrome = 0; // monochrome is not supported yet
2749
    // monochrome bit
2750
860
    if (scs->static_config.profile != HIGH_PROFILE) {
2751
860
        svt_aom_wb_write_bit(wb, is_monochrome);
2752
860
    } else {
2753
0
        assert(!is_monochrome);
2754
0
    }
2755
860
    if (scs->static_config.color_primaries == EB_CICP_CP_UNSPECIFIED &&
2756
860
        scs->static_config.transfer_characteristics == EB_CICP_TC_UNSPECIFIED &&
2757
860
        scs->static_config.matrix_coefficients == EB_CICP_MC_UNSPECIFIED) {
2758
860
        svt_aom_wb_write_bit(wb, 0); // No color description present
2759
860
    } else {
2760
0
        svt_aom_wb_write_bit(wb, 1); // Color description present
2761
0
        svt_aom_wb_write_literal(wb, scs->static_config.color_primaries, 8);
2762
0
        svt_aom_wb_write_literal(wb, scs->static_config.transfer_characteristics, 8);
2763
0
        svt_aom_wb_write_literal(wb, scs->static_config.matrix_coefficients, 8);
2764
0
    }
2765
    /* if (is_monochrome) {
2766
        // 0: [16, 235] (i.e. xvYCC), 1: [0, 255]
2767
        svt_aom_wb_write_bit(wb, scs->static_config.color_range);
2768
        return;
2769
    } */
2770
860
    if (scs->static_config.color_primaries == EB_CICP_CP_BT_709 &&
2771
0
        scs->static_config.transfer_characteristics == EB_CICP_TC_SRGB &&
2772
0
        scs->static_config.matrix_coefficients == EB_CICP_MC_IDENTITY) {
2773
        /* assert(scs->subsampling_x == 0 && scs->subsampling_y == 0);
2774
        assert(scs->static_config.profile == HIGH_PROFILE ||
2775
               (scs->static_config.profile == PROFESSIONAL_PROFILE && scs->encoder_bit_depth == EB_TWELVE_BIT)); */
2776
860
    } else {
2777
        // 0: [16, 235] (i.e. xvYCC), 1: [0, 255]
2778
860
        svt_aom_wb_write_bit(wb, scs->static_config.color_range);
2779
860
        if (scs->static_config.profile == MAIN_PROFILE) {
2780
            // 420 only
2781
860
            assert(scs->subsampling_x == 1 && scs->subsampling_y == 1);
2782
860
        } else if (scs->static_config.profile == HIGH_PROFILE) {
2783
            // 444 only
2784
0
            assert(scs->subsampling_x == 0 && scs->subsampling_y == 0);
2785
0
        } else if (scs->static_config.profile == PROFESSIONAL_PROFILE) {
2786
0
            if (scs->encoder_bit_depth == EB_TWELVE_BIT) {
2787
                // 420, 444 or 422
2788
0
                svt_aom_wb_write_bit(wb, scs->subsampling_x);
2789
0
                if (scs->subsampling_x == 0) {
2790
0
                    assert(scs->subsampling_y == 0 && "4:4:0 subsampling not allowed in AV1");
2791
0
                } else {
2792
0
                    svt_aom_wb_write_bit(wb, scs->subsampling_y);
2793
0
                }
2794
0
            } else {
2795
                // 422 only
2796
0
                assert(scs->subsampling_x == 1 && scs->subsampling_y == 0);
2797
0
            }
2798
0
        }
2799
860
        if (scs->static_config.matrix_coefficients == EB_CICP_MC_IDENTITY) {
2800
0
            assert(scs->subsampling_x == 0 && scs->subsampling_y == 0);
2801
0
        }
2802
860
        if (scs->subsampling_x == 1 && scs->subsampling_y == 1) {
2803
860
            svt_aom_wb_write_literal(wb, scs->static_config.chroma_sample_position, 2);
2804
860
        }
2805
860
    }
2806
860
    bool separate_uv_delta_q = (scs->static_config.chroma_u_ac_qindex_offset !=
2807
860
                                    scs->static_config.chroma_v_ac_qindex_offset ||
2808
860
                                scs->static_config.chroma_u_dc_qindex_offset !=
2809
860
                                    scs->static_config.chroma_v_dc_qindex_offset);
2810
860
    svt_aom_wb_write_bit(wb, separate_uv_delta_q);
2811
860
}
2812
2813
860
static void write_sequence_header(SequenceControlSet* scs, AomWriteBitBuffer* wb) {
2814
860
    const int32_t max_frame_width   = scs->seq_header.max_frame_width;
2815
860
    const int32_t max_frame_height  = scs->seq_header.max_frame_height;
2816
860
    unsigned      frame_width_bits  = svt_log2f(max_frame_width);
2817
860
    unsigned      frame_height_bits = svt_log2f(max_frame_height);
2818
860
    if (max_frame_width > (1 << frame_width_bits)) {
2819
802
        ++frame_width_bits;
2820
802
    }
2821
860
    if (max_frame_height > (1 << frame_height_bits)) {
2822
804
        ++frame_height_bits;
2823
804
    }
2824
    // AV1 spec requires at least 1 bit for frame dimensions
2825
860
    if (frame_width_bits < 1) {
2826
0
        frame_width_bits = 1;
2827
0
    }
2828
860
    if (frame_height_bits < 1) {
2829
0
        frame_height_bits = 1;
2830
0
    }
2831
860
    scs->seq_header.frame_width_bits  = frame_width_bits;
2832
860
    scs->seq_header.frame_height_bits = frame_height_bits;
2833
2834
860
    svt_aom_wb_write_literal(wb, frame_width_bits - 1, 4);
2835
860
    svt_aom_wb_write_literal(wb, frame_height_bits - 1, 4);
2836
860
    svt_aom_wb_write_literal(wb, max_frame_width - 1, frame_width_bits);
2837
860
    svt_aom_wb_write_literal(wb, max_frame_height - 1, frame_height_bits);
2838
2839
860
    if (!scs->seq_header.reduced_still_picture_header) {
2840
        //scs->frame_id_numbers_present_flag = 0;
2841
        //    cm->large_scale_tile ? 0 : cm->error_resilient_mode;
2842
2843
0
        svt_aom_wb_write_bit(wb, scs->seq_header.frame_id_numbers_present_flag);
2844
0
        if (scs->seq_header.frame_id_numbers_present_flag) {
2845
            // We must always have delta_frame_id_length < frame_id_length,
2846
            // in order for a frame to be referenced with a unique delta.
2847
            // Avoid wasting bits by using a coding that enforces this restriction.
2848
0
            svt_aom_wb_write_literal(wb, scs->seq_header.delta_frame_id_length - 2, 4);
2849
0
            svt_aom_wb_write_literal(
2850
0
                wb, ((scs->seq_header.frame_id_length) - (scs->seq_header.delta_frame_id_length) - 1), 3);
2851
0
        }
2852
0
    }
2853
2854
860
    svt_aom_wb_write_bit(wb, scs->seq_header.sb_size == BLOCK_128X128 ? 1 : 0);
2855
    //    svt_aom_write_sb_size(seq_params, wb);
2856
860
    svt_aom_wb_write_bit(wb, scs->seq_header.filter_intra_level);
2857
860
    svt_aom_wb_write_bit(wb, scs->seq_header.enable_intra_edge_filter);
2858
2859
860
    if (!scs->seq_header.reduced_still_picture_header) {
2860
0
        svt_aom_wb_write_bit(wb, scs->seq_header.enable_interintra_compound);
2861
0
        svt_aom_wb_write_bit(wb, scs->seq_header.enable_masked_compound);
2862
        //        svt_aom_wb_write_bit(wb, scs->static_config.enable_warped_motion);
2863
0
        svt_aom_wb_write_bit(wb, scs->seq_header.enable_warped_motion);
2864
0
        svt_aom_wb_write_bit(wb, scs->seq_header.enable_dual_filter);
2865
2866
0
        svt_aom_wb_write_bit(wb, scs->seq_header.order_hint_info.enable_order_hint);
2867
2868
0
        if (scs->seq_header.order_hint_info.enable_order_hint) {
2869
0
            svt_aom_wb_write_bit(wb, scs->seq_header.order_hint_info.enable_jnt_comp);
2870
0
            svt_aom_wb_write_bit(wb, scs->seq_header.order_hint_info.enable_ref_frame_mvs);
2871
0
        }
2872
2873
0
        if (scs->seq_header.seq_force_screen_content_tools == 2) {
2874
0
            svt_aom_wb_write_bit(wb, 1);
2875
0
        } else {
2876
0
            svt_aom_wb_write_bit(wb, 0);
2877
0
            svt_aom_wb_write_bit(wb, scs->seq_header.seq_force_screen_content_tools);
2878
0
        }
2879
        //
2880
0
        if (scs->seq_header.seq_force_screen_content_tools > 0) {
2881
0
            if (scs->seq_header.seq_force_integer_mv == 2) {
2882
0
                svt_aom_wb_write_bit(wb, 1);
2883
0
            } else {
2884
0
                svt_aom_wb_write_bit(wb, 0);
2885
0
                svt_aom_wb_write_bit(wb, scs->seq_header.seq_force_integer_mv);
2886
0
            }
2887
0
        } else {
2888
0
            assert(scs->seq_header.seq_force_integer_mv == 2);
2889
0
        }
2890
0
        if (scs->seq_header.order_hint_info.enable_order_hint) {
2891
0
            svt_aom_wb_write_literal(wb, scs->seq_header.order_hint_info.order_hint_bits - 1, 3);
2892
0
        }
2893
0
    }
2894
2895
860
    svt_aom_wb_write_bit(wb, scs->seq_header.enable_superres);
2896
860
    svt_aom_wb_write_bit(wb, scs->seq_header.cdef_level);
2897
860
    svt_aom_wb_write_bit(wb, scs->seq_header.enable_restoration);
2898
860
}
2899
2900
// Recenters a non-negative literal v around a reference r
2901
0
static uint16_t recenter_nonneg(uint16_t r, uint16_t v) {
2902
0
    if (v > (r << 1)) {
2903
0
        return v;
2904
0
    } else if (v >= r) {
2905
0
        return ((v - r) << 1);
2906
0
    } else {
2907
0
        return ((r - v) << 1) - 1;
2908
0
    }
2909
0
}
2910
2911
// Recenters a non-negative literal v in [0, n-1] around a
2912
// reference r also in [0, n-1]
2913
0
static uint16_t recenter_finite_nonneg(uint16_t n, uint16_t r, uint16_t v) {
2914
0
    if ((r << 1) <= n) {
2915
0
        return recenter_nonneg(r, v);
2916
0
    } else {
2917
0
        return recenter_nonneg(n - 1 - r, n - 1 - v);
2918
0
    }
2919
0
}
2920
2921
// Encodes a value v in [0, n-1] quasi-uniformly
2922
0
void svt_aom_write_primitive_quniform(AomWriter* w, uint16_t n, uint16_t v) {
2923
0
    if (n <= 1) {
2924
0
        return;
2925
0
    }
2926
0
    const int32_t l = get_msb(n - 1) + 1;
2927
0
    const int32_t m = (1 << l) - n;
2928
0
    if (v < m) {
2929
0
        aom_write_literal(w, v, l - 1);
2930
0
    } else {
2931
0
        aom_write_literal(w, m + ((v - m) >> 1), l - 1);
2932
0
        aom_write_bit(w, (v - m) & 1);
2933
0
    }
2934
0
}
2935
2936
0
static void aom_wb_write_primitive_quniform(AomWriteBitBuffer* wb, uint16_t n, uint16_t v) {
2937
0
    if (n <= 1) {
2938
0
        return;
2939
0
    }
2940
0
    const int32_t l = get_msb(n - 1) + 1;
2941
0
    const int32_t m = (1 << l) - n;
2942
0
    if (v < m) {
2943
0
        svt_aom_wb_write_literal(wb, v, l - 1);
2944
0
    } else {
2945
0
        svt_aom_wb_write_literal(wb, m + ((v - m) >> 1), l - 1);
2946
0
        svt_aom_wb_write_bit(wb, (v - m) & 1);
2947
0
    }
2948
0
}
2949
2950
0
int32_t svt_aom_count_primitive_quniform(uint16_t n, uint16_t v) {
2951
0
    if (n <= 1) {
2952
0
        return 0;
2953
0
    }
2954
0
    const int32_t l = get_msb(n - 1) + 1;
2955
0
    const int32_t m = (1 << l) - n;
2956
0
    return v < m ? l - 1 : l;
2957
0
}
2958
2959
// Finite subexponential code that codes a symbol v in [0, n-1] with parameter k
2960
0
void svt_aom_write_primitive_subexpfin(AomWriter* w, uint16_t n, uint16_t k, uint16_t v) {
2961
0
    int32_t i  = 0;
2962
0
    int32_t mk = 0;
2963
0
    while (1) {
2964
0
        int32_t b = (i ? k + i - 1 : k);
2965
0
        int32_t a = (1 << b);
2966
0
        if (n <= mk + 3 * a) {
2967
0
            svt_aom_write_primitive_quniform(w, (uint16_t)(n - mk), (uint16_t)(v - mk));
2968
0
            break;
2969
0
        } else {
2970
0
            int32_t t = (v >= mk + a);
2971
0
            aom_write_bit(w, t);
2972
0
            if (t) {
2973
0
                i = i + 1;
2974
0
                mk += a;
2975
0
            } else {
2976
0
                aom_write_literal(w, v - mk, b);
2977
0
                break;
2978
0
            }
2979
0
        }
2980
0
    }
2981
0
}
2982
2983
0
static void aom_wb_write_primitive_subexpfin(AomWriteBitBuffer* wb, uint16_t n, uint16_t k, uint16_t v) {
2984
0
    int32_t i  = 0;
2985
0
    int32_t mk = 0;
2986
0
    while (1) {
2987
0
        int32_t b = (i ? k + i - 1 : k);
2988
0
        int32_t a = (1 << b);
2989
0
        if (n <= mk + 3 * a) {
2990
0
            aom_wb_write_primitive_quniform(wb, (uint16_t)(n - mk), (uint16_t)(v - mk));
2991
0
            break;
2992
0
        } else {
2993
0
            int32_t t = (v >= mk + a);
2994
0
            svt_aom_wb_write_bit(wb, t);
2995
0
            if (t) {
2996
0
                i = i + 1;
2997
0
                mk += a;
2998
0
            } else {
2999
0
                svt_aom_wb_write_literal(wb, v - mk, b);
3000
0
                break;
3001
0
            }
3002
0
        }
3003
0
    }
3004
0
}
3005
3006
0
int32_t svt_aom_count_primitive_subexpfin(uint16_t n, uint16_t k, uint16_t v) {
3007
0
    int32_t count = 0;
3008
0
    int32_t i     = 0;
3009
0
    int32_t mk    = 0;
3010
0
    while (1) {
3011
0
        int32_t b = (i ? k + i - 1 : k);
3012
0
        int32_t a = (1 << b);
3013
0
        if (n <= mk + 3 * a) {
3014
0
            count += svt_aom_count_primitive_quniform((uint16_t)(n - mk), (uint16_t)(v - mk));
3015
0
            break;
3016
0
        } else {
3017
0
            int32_t t = (v >= mk + a);
3018
0
            count++;
3019
0
            if (t) {
3020
0
                i = i + 1;
3021
0
                mk += a;
3022
0
            } else {
3023
0
                count += b;
3024
0
                break;
3025
0
            }
3026
0
        }
3027
0
    }
3028
0
    return count;
3029
0
}
3030
3031
// Finite subexponential code that codes a symbol v in[0, n - 1] with parameter k
3032
// based on a reference ref also in [0, n-1].
3033
// Recenters symbol around r first and then uses a finite subexponential code.
3034
0
void svt_aom_write_primitive_refsubexpfin(AomWriter* w, uint16_t n, uint16_t k, uint16_t ref, uint16_t v) {
3035
0
    svt_aom_write_primitive_subexpfin(w, n, k, recenter_finite_nonneg(n, ref, v));
3036
0
}
3037
3038
static void aom_wb_write_primitive_refsubexpfin(AomWriteBitBuffer* wb, uint16_t n, uint16_t k, uint16_t ref,
3039
0
                                                uint16_t v) {
3040
0
    aom_wb_write_primitive_subexpfin(wb, n, k, recenter_finite_nonneg(n, ref, v));
3041
0
}
3042
3043
void svt_aom_wb_write_signed_primitive_refsubexpfin(AomWriteBitBuffer* wb, uint16_t n, uint16_t k, int16_t ref,
3044
0
                                                    int16_t v) {
3045
0
    ref += n - 1;
3046
0
    v += n - 1;
3047
0
    const uint16_t scaled_n = (n << 1) - 1;
3048
0
    aom_wb_write_primitive_refsubexpfin(wb, scaled_n, k, ref, v);
3049
0
}
3050
3051
0
int32_t svt_aom_count_primitive_refsubexpfin(uint16_t n, uint16_t k, uint16_t ref, uint16_t v) {
3052
0
    return svt_aom_count_primitive_subexpfin(n, k, recenter_finite_nonneg(n, ref, v));
3053
0
}
3054
3055
static void write_global_motion_params(const WarpedMotionParams* params, const WarpedMotionParams* ref_params,
3056
0
                                       AomWriteBitBuffer* wb, int32_t allow_hp) {
3057
0
    const TransformationType type = params->wmtype;
3058
0
    svt_aom_wb_write_bit(wb, type != IDENTITY);
3059
0
    if (type != IDENTITY) {
3060
0
        svt_aom_wb_write_bit(wb, type == ROTZOOM);
3061
0
        if (type != ROTZOOM) {
3062
0
            svt_aom_wb_write_bit(wb, type == TRANSLATION);
3063
0
        }
3064
0
    }
3065
3066
0
    if (type >= ROTZOOM) {
3067
0
        int16_t ref2 = (int16_t)((ref_params->wmmat[2] >> GM_ALPHA_PREC_DIFF) - (1 << GM_ALPHA_PREC_BITS));
3068
0
        int16_t v2   = (int16_t)((params->wmmat[2] >> GM_ALPHA_PREC_DIFF) - (1 << GM_ALPHA_PREC_BITS));
3069
3070
0
        int16_t ref3 = (int16_t)(ref_params->wmmat[3] >> GM_ALPHA_PREC_DIFF);
3071
0
        int16_t v3   = (int16_t)(params->wmmat[3] >> GM_ALPHA_PREC_DIFF);
3072
3073
0
        svt_aom_wb_write_signed_primitive_refsubexpfin(
3074
0
            wb,
3075
0
            GM_ALPHA_MAX + 1,
3076
0
            SUBEXPFIN_K,
3077
0
            ref2 /*(ref_params->wmmat[2] >> GM_ALPHA_PREC_DIFF) - (1 << GM_ALPHA_PREC_BITS)*/,
3078
0
            v2 /*(int16_t)((params->wmmat[2] >> GM_ALPHA_PREC_DIFF) - (1 << GM_ALPHA_PREC_BITS))*/);
3079
0
        svt_aom_wb_write_signed_primitive_refsubexpfin(wb,
3080
0
                                                       GM_ALPHA_MAX + 1,
3081
0
                                                       SUBEXPFIN_K,
3082
0
                                                       ref3 /*(ref_params->wmmat[3] >> GM_ALPHA_PREC_DIFF)*/,
3083
0
                                                       v3 /*(int16_t)(params->wmmat[3] >> GM_ALPHA_PREC_DIFF)*/);
3084
0
    }
3085
3086
0
    if (type >= AFFINE) {
3087
0
        int16_t ref4 = (int16_t)(ref_params->wmmat[4] >> GM_ALPHA_PREC_DIFF);
3088
0
        int16_t v4   = (int16_t)(params->wmmat[4] >> GM_ALPHA_PREC_DIFF);
3089
3090
0
        int16_t ref5 = (int16_t)((ref_params->wmmat[5] >> GM_ALPHA_PREC_DIFF) - (1 << GM_ALPHA_PREC_BITS));
3091
0
        int16_t v5   = (int16_t)((params->wmmat[5] >> GM_ALPHA_PREC_DIFF) - (1 << GM_ALPHA_PREC_BITS));
3092
3093
0
        svt_aom_wb_write_signed_primitive_refsubexpfin(wb,
3094
0
                                                       GM_ALPHA_MAX + 1,
3095
0
                                                       SUBEXPFIN_K,
3096
0
                                                       ref4 /*(ref_params->wmmat[4] >> GM_ALPHA_PREC_DIFF)*/,
3097
0
                                                       v4 /*(int16_t)(params->wmmat[4] >> GM_ALPHA_PREC_DIFF)*/);
3098
0
        svt_aom_wb_write_signed_primitive_refsubexpfin(
3099
0
            wb,
3100
0
            GM_ALPHA_MAX + 1,
3101
0
            SUBEXPFIN_K,
3102
0
            ref5 /*(ref_params->wmmat[5] >> GM_ALPHA_PREC_DIFF) -    (1 << GM_ALPHA_PREC_BITS)*/,
3103
0
            v5 /*(int16_t)(params->wmmat[5] >> GM_ALPHA_PREC_DIFF) - (1 << GM_ALPHA_PREC_BITS)*/);
3104
0
    }
3105
3106
0
    if (type >= TRANSLATION) {
3107
0
        const int32_t trans_bits      = (type == TRANSLATION) ? GM_ABS_TRANS_ONLY_BITS - !allow_hp : GM_ABS_TRANS_BITS;
3108
0
        const int32_t trans_prec_diff = (type == TRANSLATION) ? GM_TRANS_ONLY_PREC_DIFF + !allow_hp
3109
0
                                                              : GM_TRANS_PREC_DIFF;
3110
0
        svt_aom_wb_write_signed_primitive_refsubexpfin(wb,
3111
0
                                                       (1 << trans_bits) + 1,
3112
0
                                                       SUBEXPFIN_K,
3113
0
                                                       (int16_t)(ref_params->wmmat[0] >> trans_prec_diff),
3114
0
                                                       (int16_t)(params->wmmat[0] >> trans_prec_diff));
3115
0
        svt_aom_wb_write_signed_primitive_refsubexpfin(wb,
3116
0
                                                       (1 << trans_bits) + 1,
3117
0
                                                       SUBEXPFIN_K,
3118
0
                                                       (int16_t)(ref_params->wmmat[1] >> trans_prec_diff),
3119
0
                                                       (int16_t)(params->wmmat[1] >> trans_prec_diff));
3120
0
    }
3121
0
}
3122
3123
static void write_global_motion(PictureParentControlSet* pcs, AomWriteBitBuffer* wb)
3124
3125
0
{
3126
0
    int32_t      frame;
3127
0
    FrameHeader* frm_hdr = &pcs->frm_hdr;
3128
0
    for (frame = LAST_FRAME; frame <= ALTREF_FRAME; ++frame) {
3129
0
        const WarpedMotionParams* ref_params = (frm_hdr->primary_ref_frame != PRIMARY_REF_NONE)
3130
0
            ? &pcs->child_pcs->ref_global_motion[frame]
3131
0
            : &default_warp_params;
3132
0
        write_global_motion_params(&pcs->global_motion[frame], ref_params, wb, frm_hdr->allow_high_precision_mv);
3133
        // The logic in the commented out code below
3134
        // does not work currently and causes mismatches when resize is on.
3135
        // Fix it before turning the optimization back on.
3136
        /*
3137
        Yv12BufferConfig *ref_buf = get_ref_frame_buffer(cpi, frame);
3138
        if (cpi->source->y_crop_width == ref_buf->y_crop_width &&
3139
        cpi->source->y_crop_height == ref_buf->y_crop_height) {
3140
        write_global_motion_params(&cm->global_motion[frame],
3141
        &cm->prev_frame->global_motion[frame], wb,
3142
        cm->allow_high_precision_mv);
3143
        } else {
3144
        assert(cm->global_motion[frame].wmtype == IDENTITY &&
3145
        "Invalid warp type for frames of different resolutions");
3146
        }
3147
        */
3148
        /*
3149
        SVT_LOG("Frame %d/%d: Enc Ref %d: %d %d %d %d\n",
3150
        cm->current_video_frame, cm->show_frame, frame,
3151
        cm->global_motion[frame].wmmat[0],
3152
        cm->global_motion[frame].wmmat[1], cm->global_motion[frame].wmmat[2],
3153
        cm->global_motion[frame].wmmat[3]);
3154
        */
3155
0
    }
3156
0
}
3157
3158
#if CONFIG_ENABLE_FILM_GRAIN
3159
0
static void write_film_grain_params(PictureParentControlSet* pcs, AomWriteBitBuffer* wb) {
3160
0
    FrameHeader*  frm_hdr = &pcs->frm_hdr;
3161
0
    AomFilmGrain* pars    = &frm_hdr->film_grain_params;
3162
3163
0
    svt_aom_wb_write_bit(wb, pars->apply_grain);
3164
0
    if (!pars->apply_grain) {
3165
0
        return;
3166
0
    }
3167
3168
0
    svt_aom_wb_write_literal(wb, pars->random_seed, 16);
3169
3170
0
    if (frm_hdr->frame_type == INTER_FRAME) {
3171
0
        EbReferenceObject* ref_obj_0 = (EbReferenceObject*)pcs->child_pcs->ref_pic_ptr_array[REF_LIST_0][0]->object_ptr;
3172
0
        int32_t            ref_idx   = 0;
3173
0
        pars->update_parameters      = 1;
3174
3175
0
        if (!pars->ignore_ref) {
3176
0
            if (svt_aom_film_grain_params_equal(&ref_obj_0->film_grain_params, pars)) {
3177
0
                pars->update_parameters = 0;
3178
0
                ref_idx                 = get_ref_frame_map_idx(pcs, LAST_FRAME);
3179
0
            } else if (pcs->child_pcs->slice_type == B_SLICE) {
3180
0
                EbReferenceObject* ref_obj_1 =
3181
0
                    (EbReferenceObject*)pcs->child_pcs->ref_pic_ptr_array[REF_LIST_1][0]->object_ptr;
3182
0
                if (svt_aom_film_grain_params_equal(&ref_obj_1->film_grain_params, pars)) {
3183
0
                    pars->update_parameters = 0;
3184
0
                    ref_idx = get_ref_frame_map_idx(pcs, ALTREF_FRAME); //todo: will it always be ALF_REF in L1?
3185
0
                }
3186
0
            }
3187
0
        }
3188
3189
0
        svt_aom_wb_write_bit(wb, pars->update_parameters);
3190
0
        if (!pars->update_parameters) {
3191
0
            svt_aom_wb_write_literal(wb, ref_idx, 3);
3192
0
            return;
3193
0
        }
3194
0
    } else {
3195
0
        pars->update_parameters = 1;
3196
0
    }
3197
3198
    // Scaling functions parameters
3199
0
    svt_aom_wb_write_literal(wb, pars->num_y_points, 4); // max 14
3200
0
    for (int32_t i = 0; i < pars->num_y_points; i++) {
3201
0
        svt_aom_wb_write_literal(wb, pars->scaling_points_y[i][0], 8);
3202
0
        svt_aom_wb_write_literal(wb, pars->scaling_points_y[i][1], 8);
3203
0
    }
3204
3205
0
    if (!pcs->scs->seq_header.color_config.mono_chrome) {
3206
0
        svt_aom_wb_write_bit(wb, pars->chroma_scaling_from_luma);
3207
0
    } else {
3208
0
        pars->chroma_scaling_from_luma = 0; // for monochrome override to 0
3209
0
    }
3210
3211
0
    if (pcs->scs->seq_header.color_config.mono_chrome || pars->chroma_scaling_from_luma ||
3212
        // todo: add corresponding check when subsampling variables are present
3213
0
        ((pcs->scs->subsampling_x == 1) && (pcs->scs->subsampling_y == 1) && (pars->num_y_points == 0))) {
3214
0
        pars->num_cb_points = 0;
3215
0
        pars->num_cr_points = 0;
3216
0
    } else {
3217
0
        svt_aom_wb_write_literal(wb, pars->num_cb_points, 4); // max 10
3218
0
        for (int32_t i = 0; i < pars->num_cb_points; i++) {
3219
0
            svt_aom_wb_write_literal(wb, pars->scaling_points_cb[i][0], 8);
3220
0
            svt_aom_wb_write_literal(wb, pars->scaling_points_cb[i][1], 8);
3221
0
        }
3222
3223
0
        svt_aom_wb_write_literal(wb, pars->num_cr_points, 4); // max 10
3224
0
        for (int32_t i = 0; i < pars->num_cr_points; i++) {
3225
0
            svt_aom_wb_write_literal(wb, pars->scaling_points_cr[i][0], 8);
3226
0
            svt_aom_wb_write_literal(wb, pars->scaling_points_cr[i][1], 8);
3227
0
        }
3228
0
    }
3229
3230
0
    svt_aom_wb_write_literal(wb, pars->scaling_shift - 8, 2); // 8 + value
3231
3232
    // AR coefficients
3233
    // Only sent if the corresponsing scaling function has
3234
    // more than 0 points
3235
3236
0
    svt_aom_wb_write_literal(wb, pars->ar_coeff_lag, 2);
3237
3238
0
    int32_t num_pos_luma   = 2 * pars->ar_coeff_lag * (pars->ar_coeff_lag + 1);
3239
0
    int32_t num_pos_chroma = num_pos_luma;
3240
0
    if (pars->num_y_points > 0) {
3241
0
        ++num_pos_chroma;
3242
0
    }
3243
3244
0
    if (pars->num_y_points) {
3245
0
        for (int32_t i = 0; i < num_pos_luma; i++) {
3246
0
            svt_aom_wb_write_literal(wb, pars->ar_coeffs_y[i] + 128, 8);
3247
0
        }
3248
0
    }
3249
3250
0
    if (pars->num_cb_points || pars->chroma_scaling_from_luma) {
3251
0
        for (int32_t i = 0; i < num_pos_chroma; i++) {
3252
0
            svt_aom_wb_write_literal(wb, pars->ar_coeffs_cb[i] + 128, 8);
3253
0
        }
3254
0
    }
3255
3256
0
    if (pars->num_cr_points || pars->chroma_scaling_from_luma) {
3257
0
        for (int32_t i = 0; i < num_pos_chroma; i++) {
3258
0
            svt_aom_wb_write_literal(wb, pars->ar_coeffs_cr[i] + 128, 8);
3259
0
        }
3260
0
    }
3261
3262
0
    svt_aom_wb_write_literal(wb, pars->ar_coeff_shift - 6, 2); // 8 + value
3263
3264
0
    svt_aom_wb_write_literal(wb, pars->grain_scale_shift, 2);
3265
3266
0
    if (pars->num_cb_points) {
3267
0
        svt_aom_wb_write_literal(wb, pars->cb_mult, 8);
3268
0
        svt_aom_wb_write_literal(wb, pars->cb_luma_mult, 8);
3269
0
        svt_aom_wb_write_literal(wb, pars->cb_offset, 9);
3270
0
    }
3271
3272
0
    if (pars->num_cr_points) {
3273
0
        svt_aom_wb_write_literal(wb, pars->cr_mult, 8);
3274
0
        svt_aom_wb_write_literal(wb, pars->cr_luma_mult, 8);
3275
0
        svt_aom_wb_write_literal(wb, pars->cr_offset, 9);
3276
0
    }
3277
3278
0
    svt_aom_wb_write_bit(wb, pars->overlap_flag);
3279
3280
0
    svt_aom_wb_write_bit(wb, pars->clip_to_restricted_range);
3281
0
}
3282
#endif
3283
3284
0
static uint32_t get_ref_order_hint(PictureParentControlSet* pcs, MvReferenceFrame ref_frame) {
3285
0
    int32_t ref_idx = get_ref_frame_map_idx(pcs, ref_frame);
3286
0
    if (ref_idx == INVALID_IDX) {
3287
0
        return INVALID_IDX;
3288
0
    }
3289
0
    return pcs->dpb_order_hint[ref_idx];
3290
0
}
3291
3292
0
static void write_frame_size_with_refs(PictureParentControlSet* pcs, AomWriteBitBuffer* wb) {
3293
#if DEBUG_SFRAME
3294
    fprintf(stderr,
3295
            "\nFrame %d, dpb buf order hint %u,%u,%u,%u,%u,%u,%u\n",
3296
            (int)pcs->picture_number,
3297
            get_ref_order_hint(pcs, LAST_FRAME),
3298
            get_ref_order_hint(pcs, LAST2_FRAME),
3299
            get_ref_order_hint(pcs, LAST3_FRAME),
3300
            get_ref_order_hint(pcs, GOLDEN_FRAME),
3301
            get_ref_order_hint(pcs, BWDREF_FRAME),
3302
            get_ref_order_hint(pcs, ALTREF2_FRAME),
3303
            get_ref_order_hint(pcs, ALTREF_FRAME));
3304
#endif
3305
0
    for (uint32_t ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
3306
0
        int32_t  found          = 0;
3307
0
        uint32_t ref_order_hint = get_ref_order_hint(pcs, ref_frame);
3308
0
        if ((int32_t)ref_order_hint != INVALID_IDX) {
3309
0
            for (uint8_t i = 0; i < pcs->ref_list0_count; ++i) {
3310
0
                EbReferenceObject* ref =
3311
0
                    (EbReferenceObject*)pcs->child_pcs->ref_pic_ptr_array[REF_LIST_0][i]->object_ptr;
3312
0
                if (ref->order_hint != ref_order_hint) {
3313
0
                    continue;
3314
0
                }
3315
                // Both super-res upscaled size and render size should be checked as per spec 5.9.7,
3316
                // but in current implementation, render_and_frame_size_different is fixed to 0, see
3317
                // function write_render_size()
3318
0
                found = pcs->enhanced_pic->width == ref->reference_picture->width &&
3319
0
                    pcs->enhanced_pic->height == ref->reference_picture->height;
3320
0
                if (found) {
3321
0
                    break;
3322
0
                }
3323
0
            }
3324
0
            if (!found) {
3325
0
                for (uint8_t i = 0; i < pcs->ref_list1_count; ++i) {
3326
0
                    EbReferenceObject* ref =
3327
0
                        (EbReferenceObject*)pcs->child_pcs->ref_pic_ptr_array[REF_LIST_1][i]->object_ptr;
3328
0
                    if (ref->order_hint != ref_order_hint) {
3329
0
                        continue;
3330
0
                    }
3331
0
                    found = pcs->enhanced_pic->width == ref->reference_picture->width &&
3332
0
                        pcs->enhanced_pic->height == ref->reference_picture->height;
3333
0
                    if (found) {
3334
0
                        break;
3335
0
                    }
3336
0
                }
3337
0
            }
3338
0
        }
3339
3340
0
        svt_aom_wb_write_bit(wb, found);
3341
0
        if (found) {
3342
0
            write_superres_scale(wb, pcs);
3343
0
            return;
3344
0
        }
3345
0
    }
3346
3347
    // not found
3348
0
    const int frame_size_override = 1; // Always equal to 1 in this function
3349
0
    write_frame_size(pcs, frame_size_override, wb);
3350
0
}
3351
3352
// New function based on HLS R18
3353
static void write_uncompressed_header_obu(SequenceControlSet* scs /*Av1Comp *cpi*/, PictureParentControlSet* pcs,
3354
860
                                          AomWriteBitBuffer* wb, uint8_t show_existing) {
3355
    // Av1Common *const cm = &cpi->common;
3356
    // MacroBlockD *const xd = &cpi->td.mb.e_mbd;
3357
860
    Av1Common* const cm       = pcs->av1_cm;
3358
860
    uint16_t         tile_cnt = cm->tiles_info.tile_rows * cm->tiles_info.tile_cols;
3359
3360
860
    FrameHeader* frm_hdr = &pcs->frm_hdr;
3361
860
    if (!scs->seq_header.reduced_still_picture_header) {
3362
0
        if (show_existing) {
3363
            //SVT_ERROR("show_existing_frame not supported yet\n");
3364
            //RefCntBuffer *const frame_bufs = cm->buffer_pool->frame_bufs;
3365
            //const int32_t frame_to_show = cm->ref_frame_map[cpi->show_existing_frame];
3366
3367
            //if (frame_to_show < 0 || frame_bufs[frame_to_show].ref_count < 1) {
3368
            //    aom_internal_error(&cm->error, SVT_AOM_CODEC_UNSUP_BITSTREAM,
3369
            //        "Buffer %d does not contain a reconstructed frame",
3370
            //        frame_to_show);
3371
            //}
3372
            //ref_cnt_fb(frame_bufs, &cm->new_fb_idx, frame_to_show);
3373
3374
0
            svt_aom_wb_write_bit(wb, 1); // show_existing_frame
3375
0
            svt_aom_wb_write_literal(wb, frm_hdr->show_existing_frame, 3);
3376
0
            if (scs->seq_header.frame_id_numbers_present_flag) {
3377
0
                SVT_ERROR("frame_id_numbers_present_flag not supported yet\n");
3378
                /*int32_t frame_id_len = cm->seq_params.frame_id_length;
3379
                int32_t display_frame_id = cm->ref_frame_id[cpi->show_existing_frame];
3380
                svt_aom_wb_write_literal(wb, display_frame_id, frame_id_len);*/
3381
0
            }
3382
3383
            //        if (cm->reset_decoder_state &&
3384
            //            frame_bufs[frame_to_show].frame_type != KEY_FRAME) {
3385
            //            aom_internal_error(
3386
            //                &cm->error, SVT_AOM_CODEC_UNSUP_BITSTREAM,
3387
            //                "show_existing_frame to reset state on KEY_FRAME only");
3388
            //        }
3389
3390
0
            return;
3391
0
        } else {
3392
0
            svt_aom_wb_write_bit(wb, 0); // show_existing_frame
3393
0
        }
3394
3395
0
        svt_aom_wb_write_literal(wb, frm_hdr->frame_type, 2);
3396
3397
0
        svt_aom_wb_write_bit(wb, frm_hdr->show_frame);
3398
3399
0
        if (!frm_hdr->show_frame) {
3400
0
            svt_aom_wb_write_bit(wb, frm_hdr->showable_frame);
3401
0
        }
3402
0
        if (frm_hdr->frame_type == S_FRAME) {
3403
0
            assert(frm_hdr->error_resilient_mode);
3404
0
        } else if (!(frm_hdr->frame_type == KEY_FRAME && frm_hdr->show_frame)) {
3405
0
            svt_aom_wb_write_bit(wb, frm_hdr->error_resilient_mode);
3406
0
        }
3407
0
    }
3408
3409
860
    svt_aom_wb_write_bit(wb, frm_hdr->disable_cdf_update);
3410
3411
860
    if (scs->seq_header.seq_force_screen_content_tools == 2) {
3412
860
        svt_aom_wb_write_bit(wb, frm_hdr->allow_screen_content_tools);
3413
860
    } else {
3414
0
        assert(frm_hdr->allow_screen_content_tools == scs->seq_header.seq_force_screen_content_tools);
3415
0
    }
3416
3417
860
    if (frm_hdr->allow_screen_content_tools) {
3418
0
        if (scs->seq_header.seq_force_integer_mv == 2) {
3419
0
            svt_aom_wb_write_bit(wb, frm_hdr->force_integer_mv);
3420
0
        } else {
3421
0
            assert(frm_hdr->force_integer_mv == scs->seq_header.seq_force_integer_mv);
3422
0
        }
3423
860
    } else {
3424
860
        assert(frm_hdr->force_integer_mv == 0);
3425
860
    }
3426
3427
860
    const int32_t frame_size_override_flag = frame_is_sframe(pcs) || pcs->frame_resize_enabled
3428
860
        ? 1
3429
860
        : ((pcs->av1_cm->frm_size.superres_upscaled_width != scs->seq_header.max_frame_width) ||
3430
860
           (pcs->av1_cm->frm_size.superres_upscaled_height != scs->seq_header.max_frame_height));
3431
3432
860
    if (!scs->seq_header.reduced_still_picture_header) {
3433
0
        if (scs->seq_header.frame_id_numbers_present_flag) {
3434
0
            int32_t frame_id_len = scs->seq_header.frame_id_length;
3435
0
            svt_aom_wb_write_literal(wb, frm_hdr->current_frame_id, frame_id_len);
3436
0
        }
3437
3438
        //if (cm->width > cm->seq_params.max_frame_width ||
3439
        //    cm->height > cm->seq_params.max_frame_height) {
3440
        //    aom_internal_error(&cm->error, SVT_AOM_CODEC_UNSUP_BITSTREAM,
3441
        //        "Frame dimensions are larger than the maximum values");
3442
        //}
3443
3444
0
        if (!frame_is_sframe(pcs)) {
3445
0
            svt_aom_wb_write_bit(wb, frame_size_override_flag);
3446
0
        }
3447
3448
0
        if (scs->seq_header.order_hint_info.enable_order_hint) {
3449
0
            svt_aom_wb_write_literal(wb, (int32_t)pcs->frame_offset, scs->seq_header.order_hint_info.order_hint_bits);
3450
0
        }
3451
3452
0
        if (!frm_hdr->error_resilient_mode && !frame_is_intra_only(pcs)) {
3453
0
            svt_aom_wb_write_literal(wb, frm_hdr->primary_ref_frame, PRIMARY_REF_BITS);
3454
0
        }
3455
860
    } else { // reduced_still_picture_header
3456
860
        assert(frame_size_override_flag == 0);
3457
860
    }
3458
860
    if (frm_hdr->frame_type == KEY_FRAME) {
3459
860
        if (!frm_hdr->show_frame) {
3460
0
            svt_aom_wb_write_literal(wb, pcs->av1_ref_signal.refresh_frame_mask, REF_FRAMES);
3461
0
        }
3462
860
    } else {
3463
0
        if (frm_hdr->frame_type == INTRA_ONLY_FRAME) {
3464
            // pcs->refresh_frame_mask = get_refresh_mask(cpi);
3465
0
            int32_t updated_fb = -1;
3466
0
            for (int32_t i = 0; i < REF_FRAMES; i++) {
3467
                // If more than one frame is refreshed, it doesn't matter which one
3468
                // we pick, so pick the first.
3469
0
                if (pcs->av1_ref_signal.refresh_frame_mask & (1 << i)) {
3470
0
                    updated_fb = i;
3471
0
                    break;
3472
0
                }
3473
0
            }
3474
0
            assert(updated_fb >= 0);
3475
0
            pcs->fb_of_context_type[pcs->frame_context_idx] = updated_fb;
3476
3477
0
            svt_aom_wb_write_literal(wb, pcs->av1_ref_signal.refresh_frame_mask, REF_FRAMES);
3478
0
        } else if (frm_hdr->frame_type == INTER_FRAME || frame_is_sframe(pcs)) {
3479
            //pcs->refresh_frame_mask = get_refresh_mask(cpi);
3480
0
            if (frm_hdr->frame_type == INTER_FRAME) {
3481
0
                svt_aom_wb_write_literal(wb, pcs->av1_ref_signal.refresh_frame_mask, REF_FRAMES);
3482
0
            } else {
3483
0
                assert(frame_is_sframe(pcs) && pcs->av1_ref_signal.refresh_frame_mask == 0xFF);
3484
0
            }
3485
3486
            // write ref order hint map into bitstream
3487
0
            if (pcs->frm_hdr.error_resilient_mode && scs->seq_header.order_hint_info.enable_order_hint) {
3488
0
                for (int32_t ref_idx = 0; ref_idx < REF_FRAMES; ref_idx++) {
3489
0
                    svt_aom_wb_write_literal(
3490
0
                        wb, pcs->dpb_order_hint[ref_idx], scs->seq_header.order_hint_info.order_hint_bits);
3491
0
                }
3492
0
            }
3493
3494
0
            int32_t updated_fb = -1;
3495
0
            for (int32_t i = 0; i < REF_FRAMES; i++) {
3496
                // If more than one frame is refreshed, it doesn't matter which one
3497
                // we pick, so pick the first.
3498
0
                if (pcs->av1_ref_signal.refresh_frame_mask & (1 << i)) {
3499
0
                    updated_fb = i;
3500
0
                    break;
3501
0
                }
3502
0
            }
3503
            // large scale tile sometimes won't refresh any fbs
3504
0
            if (updated_fb >= 0) {
3505
0
                pcs->fb_of_context_type[pcs->frame_context_idx] = updated_fb;
3506
0
            }
3507
0
        }
3508
0
    }
3509
3510
#if DEBUG_SFRAME
3511
    {
3512
        uint32_t* _ref_frame_map = pcs->dpb_order_hint;
3513
        fprintf(stderr,
3514
                "\nFrame %d, use_ref_frame_mvs %u, ref_order_hint_map %d,%d,%d,%d,%d,%d,%d,%d\n",
3515
                (int)pcs->picture_number,
3516
                frm_hdr->use_ref_frame_mvs,
3517
                _ref_frame_map[0],
3518
                _ref_frame_map[1],
3519
                _ref_frame_map[2],
3520
                _ref_frame_map[3],
3521
                _ref_frame_map[4],
3522
                _ref_frame_map[5],
3523
                _ref_frame_map[6],
3524
                _ref_frame_map[7]);
3525
    }
3526
#endif
3527
3528
860
    if (frm_hdr->frame_type == KEY_FRAME) {
3529
860
        write_frame_size(pcs, frame_size_override_flag, wb);
3530
860
        assert(av1_superres_unscaled(&(pcs->av1_cm->frm_size)) || !(frm_hdr->allow_intrabc));
3531
860
        if (frm_hdr->allow_screen_content_tools && av1_superres_unscaled(&(pcs->av1_cm->frm_size))) {
3532
0
            svt_aom_wb_write_bit(wb, frm_hdr->allow_intrabc);
3533
0
        }
3534
        // all eight fbs are refreshed, pick one that will live long enough
3535
860
        pcs->fb_of_context_type[REGULAR_FRAME] = 0;
3536
860
    } else {
3537
0
        if (frm_hdr->frame_type == INTRA_ONLY_FRAME) {
3538
0
            write_frame_size(pcs, frame_size_override_flag, wb);
3539
0
            assert(av1_superres_unscaled(&(pcs->av1_cm->frm_size)) || !(frm_hdr->allow_intrabc));
3540
0
            if (frm_hdr->allow_screen_content_tools && av1_superres_unscaled(&(pcs->av1_cm->frm_size))) {
3541
0
                svt_aom_wb_write_bit(wb, frm_hdr->allow_intrabc);
3542
0
            }
3543
0
        } else if (frm_hdr->frame_type == INTER_FRAME || frame_is_sframe(pcs)) {
3544
0
            MvReferenceFrame ref_frame;
3545
3546
0
            assert(frm_hdr->frame_refs_short_signaling == 0);
3547
            // NOTE: Error resilient mode turns off frame_refs_short_signaling
3548
            //       automatically.
3549
0
            if (scs->seq_header.order_hint_info.enable_order_hint) {
3550
0
                svt_aom_wb_write_bit(wb, frm_hdr->frame_refs_short_signaling);
3551
0
            }
3552
3553
0
            if (frm_hdr->frame_refs_short_signaling) {
3554
0
                svt_aom_wb_write_literal(wb, get_ref_frame_map_idx(pcs, LAST_FRAME), REF_FRAMES_LOG2);
3555
0
                svt_aom_wb_write_literal(wb, get_ref_frame_map_idx(pcs, GOLDEN_FRAME), REF_FRAMES_LOG2);
3556
0
            }
3557
0
            for (ref_frame = LAST_FRAME; ref_frame <= ALTREF_FRAME; ++ref_frame) {
3558
0
                assert(get_ref_frame_map_idx(pcs, ref_frame) != INVALID_IDX);
3559
0
                if (!frm_hdr->frame_refs_short_signaling) {
3560
0
                    svt_aom_wb_write_literal(wb, get_ref_frame_map_idx(pcs, ref_frame), REF_FRAMES_LOG2);
3561
0
                }
3562
3563
0
                if (scs->seq_header.frame_id_numbers_present_flag) {
3564
0
                    SVT_ERROR("frame_id_numbers_present_flag not supported yet\n");
3565
                    //int32_t i = get_ref_frame_map_idx(cpi, ref_frame);
3566
                    //int32_t frame_id_len = cm->seq_params.frame_id_length;
3567
                    //int32_t diff_len = cm->seq_params.delta_frame_id_length;
3568
                    //int32_t delta_frame_id_minus1 =
3569
                    //    ((cm->current_frame_id - cm->ref_frame_id[i] +
3570
                    //    (1 << frame_id_len)) %
3571
                    //    (1 << frame_id_len)) -
3572
                    //    1;
3573
                    //if (delta_frame_id_minus1 < 0 ||
3574
                    //    delta_frame_id_minus1 >= (1 << diff_len))
3575
                    //    cm->invalid_delta_frame_id_minus1 = 1;
3576
                    //svt_aom_wb_write_literal(wb, delta_frame_id_minus1, diff_len);
3577
0
                }
3578
0
            }
3579
3580
0
            if (!pcs->frm_hdr.error_resilient_mode && frame_size_override_flag) {
3581
0
                write_frame_size_with_refs(pcs, wb);
3582
0
            } else {
3583
0
                write_frame_size(pcs, frame_size_override_flag, wb);
3584
0
            }
3585
3586
0
            if (frm_hdr->force_integer_mv) {
3587
0
                frm_hdr->allow_high_precision_mv = 0;
3588
0
            } else {
3589
0
                svt_aom_wb_write_bit(wb, frm_hdr->allow_high_precision_mv);
3590
0
            }
3591
0
#define LOG_SWITCHABLE_FILTERS 2
3592
3593
0
            svt_aom_wb_write_bit(wb, pcs->frm_hdr.interpolation_filter == SWITCHABLE);
3594
0
            if (pcs->frm_hdr.interpolation_filter != SWITCHABLE) {
3595
0
                svt_aom_wb_write_literal(wb, pcs->frm_hdr.interpolation_filter, LOG_SWITCHABLE_FILTERS);
3596
0
            }
3597
3598
0
            svt_aom_wb_write_bit(wb, frm_hdr->is_motion_mode_switchable);
3599
0
            if (frame_might_allow_ref_frame_mvs(pcs, scs)) {
3600
0
                svt_aom_wb_write_bit(wb, frm_hdr->use_ref_frame_mvs);
3601
0
            }
3602
0
        }
3603
0
    }
3604
3605
    //if (scs->frame_id_numbers_present_flag)
3606
    //    pcs->refresh_mask = get_refresh_mask(pcs);
3607
860
    const int32_t might_bwd_adapt = !(scs->seq_header.reduced_still_picture_header) && !(frm_hdr->disable_cdf_update);
3608
860
    if (pcs->large_scale_tile) {
3609
0
        pcs->refresh_frame_context = REFRESH_FRAME_CONTEXT_DISABLED;
3610
0
    }
3611
860
    if (might_bwd_adapt) {
3612
0
        svt_aom_wb_write_bit(wb, pcs->refresh_frame_context == REFRESH_FRAME_CONTEXT_DISABLED);
3613
0
    }
3614
3615
860
    write_tile_info(pcs, /*saved_wb,*/ wb);
3616
3617
860
    encode_quantization(pcs, wb);
3618
860
    encode_segmentation(pcs, wb);
3619
    //svt_aom_wb_write_bit(wb, 0);
3620
    //encode_segmentation(cm, xd, wb);
3621
    //if (pcs->delta_q_present_flag)
3622
    // assert(delta_q_allowed == 1 && frm_hdr->quantisation_params.base_q_idx > 0);
3623
3624
860
    if (frm_hdr->quantization_params.base_q_idx > 0) {
3625
490
        svt_aom_wb_write_bit(wb, frm_hdr->delta_q_params.delta_q_present);
3626
490
        if (frm_hdr->delta_q_params.delta_q_present) {
3627
0
            svt_aom_wb_write_literal(wb, svt_log2f_safe(frm_hdr->delta_q_params.delta_q_res), 2);
3628
0
            for (uint16_t tile_idx = 0; tile_idx < tile_cnt; tile_idx++) {
3629
0
                pcs->prev_qindex[tile_idx] = frm_hdr->quantization_params.base_q_idx;
3630
0
            }
3631
0
            if (frm_hdr->allow_intrabc) {
3632
0
                assert(frm_hdr->delta_lf_params.delta_lf_present == 0);
3633
0
            } else {
3634
0
                svt_aom_wb_write_bit(wb, frm_hdr->delta_lf_params.delta_lf_present);
3635
0
            }
3636
0
            if (frm_hdr->delta_lf_params.delta_lf_present) {
3637
0
                svt_aom_wb_write_literal(wb, svt_log2f_safe(frm_hdr->delta_lf_params.delta_lf_res), 2);
3638
0
                pcs->prev_delta_lf_from_base = 0;
3639
0
                svt_aom_wb_write_bit(wb, frm_hdr->delta_lf_params.delta_lf_multi);
3640
0
                const int32_t frame_lf_count = pcs->monochrome == 0 ? FRAME_LF_COUNT : FRAME_LF_COUNT - 2;
3641
0
                for (int32_t lf_id = 0; lf_id < frame_lf_count; ++lf_id) {
3642
0
                    pcs->prev_delta_lf[lf_id] = 0;
3643
0
                }
3644
0
            }
3645
0
        }
3646
490
    }
3647
3648
860
    if (frm_hdr->all_lossless) {
3649
370
        assert(av1_superres_unscaled(&(pcs->av1_cm->frm_size)));
3650
490
    } else {
3651
490
        if (!frm_hdr->coded_lossless) {
3652
490
            encode_loopfilter(pcs, wb);
3653
490
            if (scs->seq_header.cdef_level) {
3654
490
                encode_cdef(pcs, wb);
3655
490
            }
3656
490
        }
3657
3658
490
        if (scs->seq_header.enable_restoration) {
3659
0
            encode_restoration_mode(pcs, wb);
3660
0
        }
3661
490
    }
3662
860
    if (frm_hdr->coded_lossless) {
3663
370
        assert(1); // assert(frm_hdr->tx_mode == ONLY_4X4);
3664
490
    } else {
3665
490
        svt_aom_wb_write_bit(wb, frm_hdr->tx_mode == TX_MODE_SELECT);
3666
490
    }
3667
    //write_tx_mode(cm, &pcs->tx_mode, wb);
3668
3669
860
    if (pcs->allow_comp_inter_inter) {
3670
0
        const int32_t use_hybrid_pred = frm_hdr->reference_mode == REFERENCE_MODE_SELECT;
3671
3672
0
        svt_aom_wb_write_bit(wb, use_hybrid_pred);
3673
0
    }
3674
3675
860
    if (frm_hdr->skip_mode_params.skip_mode_allowed) {
3676
0
        svt_aom_wb_write_bit(wb, frm_hdr->skip_mode_params.skip_mode_flag);
3677
0
    }
3678
3679
860
    if (frame_might_allow_warped_motion(pcs, scs)) {
3680
0
        svt_aom_wb_write_bit(wb, frm_hdr->allow_warped_motion);
3681
860
    } else {
3682
860
        assert(!frm_hdr->allow_warped_motion);
3683
860
    }
3684
3685
860
    svt_aom_wb_write_bit(wb, frm_hdr->reduced_tx_set);
3686
3687
860
    if (!frame_is_intra_only(pcs)) {
3688
        //  SVT_ERROR("Global motion not supported yet\n");
3689
0
        write_global_motion(pcs, wb);
3690
0
    }
3691
860
#if CONFIG_ENABLE_FILM_GRAIN
3692
860
    if (scs->seq_header.film_grain_params_present && (frm_hdr->show_frame || frm_hdr->showable_frame)) {
3693
0
        write_film_grain_params(pcs, wb);
3694
0
    }
3695
860
#endif
3696
860
}
3697
3698
1.29k
static uint32_t write_obu_header(ObuType obu_type, int32_t obuExtension, uint8_t* const dst) {
3699
1.29k
    AomWriteBitBuffer wb   = {dst, 0};
3700
1.29k
    uint32_t          size = 0;
3701
3702
1.29k
    svt_aom_wb_write_literal(&wb, 0, 1); // forbidden bit.
3703
1.29k
    svt_aom_wb_write_literal(&wb, (int32_t)obu_type, 4);
3704
1.29k
    svt_aom_wb_write_literal(&wb, obuExtension ? 1 : 0, 1);
3705
1.29k
    svt_aom_wb_write_literal(&wb, 1, 1); // obu_has_payload_length_field
3706
1.29k
    svt_aom_wb_write_literal(&wb, 0, 1); // reserved
3707
3708
1.29k
    if (obuExtension) {
3709
0
        svt_aom_wb_write_literal(&wb, obuExtension & 0xFF, 8);
3710
0
    }
3711
1.29k
    size = svt_aom_wb_bytes_written(&wb);
3712
1.29k
    return size;
3713
1.29k
}
3714
3715
430
static int32_t write_uleb_obu_size(uint32_t obu_header_size, uint32_t obu_payload_size, uint8_t* dest) {
3716
430
    const uint32_t obu_size       = obu_payload_size;
3717
430
    const uint32_t offset         = obu_header_size;
3718
430
    size_t         coded_obu_size = 0;
3719
3720
430
    if (svt_aom_uleb_encode(obu_size, sizeof(obu_size), dest + offset, &coded_obu_size) != 0) {
3721
0
        return SVT_AOM_CODEC_ERROR;
3722
0
    }
3723
3724
430
    return SVT_AOM_CODEC_OK;
3725
430
}
3726
3727
860
static void add_trailing_bits(AomWriteBitBuffer* wb) {
3728
860
    if (svt_aom_wb_is_byte_aligned(wb)) {
3729
424
        svt_aom_wb_write_literal(wb, 0x80, 8);
3730
436
    } else {
3731
        // assumes that the other bits are already 0s
3732
436
        svt_aom_wb_write_bit(wb, 1);
3733
436
    }
3734
860
}
3735
3736
// writes the type and payload of the provided metadata to the address dst as a metadata OBU
3737
0
static uint32_t write_obu_metadata(SvtMetadataT* metadata, uint8_t* const dst) {
3738
0
    if (!metadata || !metadata->payload) {
3739
0
        return 0;
3740
0
    }
3741
0
    AomWriteBitBuffer wb   = {dst, 0};
3742
0
    uint32_t          size = 0;
3743
0
    svt_aom_wb_write_literal(&wb, metadata->type, 8);
3744
0
    for (size_t i = 0; i < metadata->sz; ++i) {
3745
0
        svt_aom_wb_write_literal(&wb, metadata->payload[i], 8);
3746
0
    }
3747
0
    add_trailing_bits(&wb);
3748
0
    size = svt_aom_wb_bytes_written(&wb);
3749
0
    return size;
3750
0
}
3751
3752
860
static void write_bitstream_level(BitstreamLevel bl, AomWriteBitBuffer* wb) {
3753
860
    uint8_t seq_level_idx = major_minor_to_seq_level_idx(bl);
3754
860
    assert(is_valid_seq_level_idx(seq_level_idx));
3755
860
    svt_aom_wb_write_literal(wb, seq_level_idx, LEVEL_BITS);
3756
860
}
3757
3758
860
static uint32_t write_sequence_header_obu(SequenceControlSet* scs, uint8_t* const dst, uint8_t numberSpatialLayers) {
3759
860
    AomWriteBitBuffer wb   = {dst, 0};
3760
860
    uint32_t          size = 0;
3761
3762
860
    set_bitstream_level_tier(scs);
3763
3764
860
    write_profile((BitstreamProfile)scs->static_config.profile, &wb);
3765
3766
    // Still picture or not
3767
860
    svt_aom_wb_write_bit(&wb, scs->seq_header.still_picture);
3768
860
    assert(IMPLIES(!scs->seq_header.still_picture, !scs->seq_header.reduced_still_picture_header));
3769
3770
    // whether to use reduced still picture header
3771
860
    svt_aom_wb_write_bit(&wb, scs->seq_header.reduced_still_picture_header);
3772
3773
860
    if (scs->seq_header.reduced_still_picture_header) {
3774
860
        write_bitstream_level(scs->level[0], &wb);
3775
860
    } else {
3776
0
        svt_aom_wb_write_bit(&wb, scs->seq_header.timing_info.timing_info_present); // timing info present flag
3777
3778
0
        if (scs->seq_header.timing_info.timing_info_present) {
3779
            // timing_info
3780
0
            SVT_ERROR("timing_info_present not supported\n");
3781
            /*write_timing_info_header(cm, &wb);
3782
            svt_aom_wb_write_bit(&wb, cm->decoder_model_info_present_flag);
3783
            if (cm->decoder_model_info_present_flag) write_decoder_model_info(cm, &wb);*/
3784
0
        }
3785
0
        svt_aom_wb_write_bit(&wb, scs->seq_header.initial_display_delay_present_flag);
3786
3787
0
        uint8_t operating_points_cnt_minus_1 = numberSpatialLayers > 1 ? numberSpatialLayers - 1 : 0;
3788
0
        svt_aom_wb_write_literal(&wb, operating_points_cnt_minus_1, OP_POINTS_CNT_MINUS_1_BITS);
3789
0
        int32_t i;
3790
0
        for (i = 0; i < operating_points_cnt_minus_1 + 1; i++) {
3791
0
            svt_aom_wb_write_literal(&wb, scs->seq_header.operating_point[i].op_idc, OP_POINTS_IDC_BITS);
3792
0
            write_bitstream_level(scs->level[i], &wb);
3793
0
            if (scs->level[i].major > 3) {
3794
0
                svt_aom_wb_write_bit(&wb, scs->seq_header.operating_point[i].seq_tier);
3795
0
            }
3796
0
            if (scs->seq_header.decoder_model_info_present_flag) {
3797
0
                SVT_ERROR("decoder_model_info_present_flag not supported\n");
3798
                //svt_aom_wb_write_bit(&wb,
3799
                //    cm->op_params[i].decoder_model_param_present_flag);
3800
                //if (cm->op_params[i].decoder_model_param_present_flag)
3801
                //    write_dec_model_op_parameters(cm, &wb, i);
3802
0
            }
3803
0
            if (scs->seq_header.initial_display_delay_present_flag) {
3804
0
                svt_aom_wb_write_bit(&wb, scs->seq_header.operating_point[i].initial_display_delay_present_for_this_op);
3805
0
                if (scs->seq_header.operating_point[i].initial_display_delay_present_for_this_op) {
3806
0
                    assert(scs->seq_header.operating_point[i].initial_display_delay <= 10);
3807
0
                    svt_aom_wb_write_literal(&wb, scs->seq_header.operating_point[i].initial_display_delay - 1, 4);
3808
0
                }
3809
0
            }
3810
0
        }
3811
0
    }
3812
860
    write_sequence_header(scs, &wb);
3813
3814
860
    write_color_config(scs, &wb);
3815
3816
860
    svt_aom_wb_write_bit(&wb, scs->seq_header.film_grain_params_present);
3817
3818
860
    add_trailing_bits(&wb);
3819
3820
860
    size = svt_aom_wb_bytes_written(&wb);
3821
860
    return size;
3822
860
}
3823
3824
static uint32_t write_tile_group_header(uint8_t* const dst, int startTile, int endTile, int tiles_log2,
3825
860
                                        int tile_start_and_end_present_flag) {
3826
860
    AomWriteBitBuffer wb   = {dst, 0};
3827
860
    uint32_t          size = 0;
3828
3829
860
    if (!tiles_log2) {
3830
10
        return size;
3831
10
    }
3832
850
    svt_aom_wb_write_bit(&wb, tile_start_and_end_present_flag);
3833
3834
850
    if (tile_start_and_end_present_flag) {
3835
0
        svt_aom_wb_write_literal(&wb, startTile, tiles_log2);
3836
0
        svt_aom_wb_write_literal(&wb, endTile, tiles_log2);
3837
0
    }
3838
3839
850
    size = svt_aom_wb_bytes_written(&wb);
3840
850
    return size;
3841
860
}
3842
3843
static uint32_t write_frame_header_obu(SequenceControlSet* scs, PictureParentControlSet* pcs, uint8_t* const dst,
3844
860
                                       uint8_t show_existing, int32_t appendTrailingBits) {
3845
860
    AomWriteBitBuffer wb         = {dst, 0};
3846
860
    uint32_t          total_size = 0;
3847
3848
860
    write_uncompressed_header_obu(scs, pcs, /* saved_wb,*/ &wb, show_existing);
3849
3850
860
    if (appendTrailingBits) {
3851
0
        add_trailing_bits(&wb);
3852
0
    }
3853
3854
860
    if (show_existing) {
3855
0
        total_size = svt_aom_wb_bytes_written(&wb);
3856
0
        return total_size;
3857
0
    }
3858
3859
860
    total_size = svt_aom_wb_bytes_written(&wb);
3860
860
    return total_size;
3861
860
}
3862
3863
EbErrorType svt_aom_write_metadata_av1(Bitstream* bitstream_ptr, SvtMetadataArrayT* metadata,
3864
1.29k
                                       const EbAv1MetadataType type) {
3865
1.29k
    EbErrorType return_error = EB_ErrorNone;
3866
1.29k
    if (!metadata || !metadata->metadata_array) {
3867
1.29k
        return EB_ErrorBadParameter;
3868
1.29k
    }
3869
3870
0
    OutputBitstreamUnit* output_bitstream_ptr = (OutputBitstreamUnit*)bitstream_ptr->output_bitstream_ptr;
3871
0
    uint8_t*             data                 = output_bitstream_ptr->buffer_av1;
3872
3873
0
    for (size_t i = 0; i < metadata->sz; i++) {
3874
0
        SvtMetadataT* current_metadata = metadata->metadata_array[i];
3875
0
        if (current_metadata && current_metadata->payload && current_metadata->type == type) {
3876
            // Phase 1: measure header + payload sizes
3877
0
            uint32_t obu_header_size   = write_obu_header(OBU_METADATA, 0, data);
3878
0
            uint32_t obu_payload_size  = write_obu_metadata(current_metadata, data + obu_header_size);
3879
0
            size_t   length_field_size = svt_aom_uleb_size_in_bytes(obu_payload_size);
3880
3881
            // Phase 2: write at correct offsets (re-write payload after LEB128)
3882
            // OBU header already at data[0]
3883
0
            size_t  coded_size;
3884
0
            int32_t ret = svt_aom_uleb_encode(
3885
0
                obu_payload_size, sizeof(obu_payload_size), data + obu_header_size, &coded_size);
3886
0
            assert(ret == 0 && coded_size == length_field_size);
3887
0
            if (ret != 0 || coded_size != length_field_size) {
3888
0
                return EB_ErrorBadParameter;
3889
0
            }
3890
0
            write_obu_metadata(current_metadata, data + obu_header_size + length_field_size);
3891
3892
0
            data += obu_header_size + length_field_size + obu_payload_size;
3893
0
        }
3894
0
    }
3895
0
    output_bitstream_ptr->buffer_av1 = data;
3896
0
    return return_error;
3897
0
}
3898
3899
/**************************************************
3900
* EncodeFrameHeaderHeader
3901
**************************************************/
3902
EbErrorType svt_aom_write_frame_header_av1(Bitstream* bitstream_ptr, SequenceControlSet* scs, PictureControlSet* pcs,
3903
430
                                           uint8_t show_existing) {
3904
430
    EbErrorType              return_error         = EB_ErrorNone;
3905
430
    OutputBitstreamUnit*     output_bitstream_ptr = (OutputBitstreamUnit*)bitstream_ptr->output_bitstream_ptr;
3906
430
    PictureParentControlSet* ppcs                 = pcs->ppcs;
3907
430
    Av1Common* const         cm                   = ppcs->av1_cm;
3908
430
    uint16_t                 tile_cnt             = cm->tiles_info.tile_rows * cm->tiles_info.tile_cols;
3909
430
    uint8_t*                 data                 = output_bitstream_ptr->buffer_av1;
3910
3911
430
    ObuType obu_type                        = show_existing ? OBU_FRAME_HEADER : OBU_FRAME;
3912
430
    int     n_log2_tiles                    = ppcs->av1_cm->log2_tile_rows + ppcs->av1_cm->log2_tile_cols;
3913
430
    int     tile_start_and_end_present_flag = 0;
3914
3915
    // Phase 1: Measure header sizes by writing to data (will be overwritten in phase 2).
3916
430
    uint32_t obu_header_size = write_obu_header(obu_type, 0, data);
3917
430
    uint32_t frame_hdr_size  = write_frame_header_obu(scs, ppcs, data + obu_header_size, show_existing, show_existing);
3918
430
    uint32_t tg_hdr_size     = write_tile_group_header(
3919
430
        data + obu_header_size + frame_hdr_size, 0, 0, n_log2_tiles, tile_start_and_end_present_flag);
3920
430
    uint32_t hdr_payload_size = frame_hdr_size + tg_hdr_size;
3921
3922
    // Compute tile data size (tile size prefixes + tile data).
3923
430
    uint32_t tile_data_size = 0;
3924
430
    if (!show_existing) {
3925
4.96k
        for (int tile_idx = 0; tile_idx < tile_cnt; tile_idx++) {
3926
4.53k
            tile_data_size += pcs->ec_info[tile_idx]->ec->ec_writer.pos;
3927
4.53k
            if (tile_idx != tile_cnt - 1 && tile_cnt > 1) {
3928
4.10k
                tile_data_size += pcs->tile_size_bytes_minus_1 + 1;
3929
4.10k
            }
3930
4.53k
        }
3931
430
    }
3932
3933
    // Compute exact OBU payload size and LEB128 field size.
3934
430
    uint32_t obu_payload_size  = hdr_payload_size + tile_data_size;
3935
430
    size_t   length_field_size = svt_aom_uleb_size_in_bytes(obu_payload_size);
3936
3937
    // Ensure buffer is large enough for the complete OBU.
3938
430
    uint32_t total_obu_size = obu_header_size + (uint32_t)length_field_size + obu_payload_size;
3939
430
    uint32_t buf_needed     = total_obu_size +
3940
430
        (uint32_t)(output_bitstream_ptr->buffer_av1 - output_bitstream_ptr->buffer_begin_av1);
3941
430
    if (output_bitstream_ptr->size < buf_needed) {
3942
0
        svt_realloc_output_bitstream_unit(output_bitstream_ptr, buf_needed + 1);
3943
0
        data = output_bitstream_ptr->buffer_av1;
3944
0
    }
3945
3946
    // Phase 2: Write everything at the correct offsets — no memmove needed.
3947
    // OBU header is already at data[0] from phase 1 (same content, same position).
3948
3949
    // LEB128 size field right after OBU header.
3950
430
    size_t coded_size;
3951
430
    svt_aom_uleb_encode(obu_payload_size, sizeof(obu_payload_size), data + obu_header_size, &coded_size);
3952
3953
    // Re-write frame header + tile group header at the correct offset (after LEB128).
3954
430
    uint32_t write_offset = obu_header_size + (uint32_t)length_field_size;
3955
430
    write_frame_header_obu(scs, ppcs, data + write_offset, show_existing, show_existing);
3956
430
    write_offset += frame_hdr_size;
3957
430
    write_tile_group_header(data + write_offset, 0, 0, n_log2_tiles, tile_start_and_end_present_flag);
3958
430
    write_offset += tg_hdr_size;
3959
3960
    // Copy tile data.
3961
430
    if (!show_existing) {
3962
4.96k
        for (int tile_idx = 0; tile_idx < tile_cnt; tile_idx++) {
3963
4.53k
            int32_t tile_size       = pcs->ec_info[tile_idx]->ec->ec_writer.pos;
3964
4.53k
            uint8_t tile_size_bytes = 0;
3965
4.53k
            if (tile_idx != tile_cnt - 1 && tile_cnt > 1) {
3966
4.10k
                tile_size_bytes = pcs->tile_size_bytes_minus_1 + 1;
3967
4.10k
                mem_put_varsize(data + write_offset, tile_size_bytes, tile_size - 1);
3968
4.10k
            }
3969
4.53k
            OutputBitstreamUnit* ec_output_bitstream_ptr =
3970
4.53k
                (OutputBitstreamUnit*)pcs->ec_info[tile_idx]->ec->ec_output_bitstream_ptr;
3971
4.53k
            svt_memcpy(data + write_offset + tile_size_bytes, ec_output_bitstream_ptr->buffer_begin_av1, tile_size);
3972
4.53k
            write_offset += (tile_size + tile_size_bytes);
3973
4.53k
        }
3974
430
    }
3975
3976
430
    data += total_obu_size;
3977
430
    output_bitstream_ptr->buffer_av1 = data;
3978
430
    return return_error;
3979
430
}
3980
3981
/**************************************************
3982
* svt_aom_encode_sps_av1
3983
**************************************************/
3984
430
EbErrorType svt_aom_encode_sps_av1(Bitstream* bitstream_ptr, SequenceControlSet* scs) {
3985
430
    EbErrorType          return_error             = EB_ErrorNone;
3986
430
    OutputBitstreamUnit* output_bitstream_ptr     = (OutputBitstreamUnit*)bitstream_ptr->output_bitstream_ptr;
3987
430
    uint8_t*             data                     = output_bitstream_ptr->buffer_av1;
3988
430
    const uint8_t        enhancement_layers_count = 0; // cm->enhancement_layers_count;
3989
3990
    // Phase 1: measure
3991
430
    uint32_t obu_header_size   = write_obu_header(OBU_SEQUENCE_HEADER, 0, data);
3992
430
    uint32_t obu_payload_size  = write_sequence_header_obu(scs, data + obu_header_size, enhancement_layers_count);
3993
430
    size_t   length_field_size = svt_aom_uleb_size_in_bytes(obu_payload_size);
3994
3995
    // Phase 2: write at correct offsets (re-write payload after LEB128)
3996
430
    size_t  coded_size;
3997
430
    int32_t ret = svt_aom_uleb_encode(obu_payload_size, sizeof(obu_payload_size), data + obu_header_size, &coded_size);
3998
430
    assert(ret == 0 && coded_size == length_field_size);
3999
430
    if (ret != 0 || coded_size != length_field_size) {
4000
0
        return EB_ErrorBadParameter;
4001
0
    }
4002
430
    write_sequence_header_obu(scs, data + obu_header_size + length_field_size, enhancement_layers_count);
4003
4004
430
    data += obu_header_size + length_field_size + obu_payload_size;
4005
430
    output_bitstream_ptr->buffer_av1 = data;
4006
430
    return return_error;
4007
430
}
4008
4009
/**************************************************
4010
* svt_aom_encode_td_av1
4011
**************************************************/
4012
430
EbErrorType svt_aom_encode_td_av1(uint8_t* output_bitstream_ptr) {
4013
430
    assert(output_bitstream_ptr != NULL);
4014
4015
    // move data and insert OBU_TD preceded by optional 4 byte size
4016
    // OBUs are preceded/succeeded by an unsigned leb128 coded integer.
4017
430
    write_uleb_obu_size(write_obu_header(OBU_TEMPORAL_DELIMITER, 0, output_bitstream_ptr), 0, output_bitstream_ptr);
4018
430
    return EB_ErrorNone;
4019
430
}
4020
4021
0
static void av1_write_delta_q_index(FRAME_CONTEXT* frame_context, int32_t delta_qindex, AomWriter* w) {
4022
0
    int32_t sign     = delta_qindex < 0;
4023
0
    int32_t abs      = sign ? -delta_qindex : delta_qindex;
4024
0
    int32_t smallval = abs < DELTA_Q_SMALL ? 1 : 0;
4025
    //FRAME_CONTEXT *ec_ctx = xd->tile_ctx;
4026
4027
0
    aom_write_symbol(w, AOMMIN(abs, DELTA_Q_SMALL), frame_context->delta_q_cdf, DELTA_Q_PROBS + 1);
4028
4029
0
    if (!smallval) {
4030
0
        int32_t rem_bits = svt_log2f(abs - 1);
4031
0
        int32_t thr      = (1 << rem_bits) + 1;
4032
0
        aom_write_literal(w, rem_bits - 1, 3);
4033
0
        aom_write_literal(w, abs - thr, rem_bits);
4034
0
    }
4035
0
    if (abs > 0) {
4036
0
        aom_write_bit(w, sign);
4037
0
    }
4038
0
}
4039
4040
static void write_cdef(SequenceControlSet* scs, PictureControlSet* pcs, EntropyCodingContext* ctx, AomWriter* w,
4041
121k
                       int32_t skip, int32_t mi_col, int32_t mi_row) {
4042
121k
    Av1Common*   cm      = pcs->ppcs->av1_cm;
4043
121k
    FrameHeader* frm_hdr = &pcs->ppcs->frm_hdr;
4044
4045
121k
    if (frm_hdr->coded_lossless || frm_hdr->allow_intrabc) {
4046
        // Initialize to indicate no CDEF for safety.
4047
114k
        frm_hdr->cdef_params.cdef_bits           = 0;
4048
114k
        frm_hdr->cdef_params.cdef_y_strength[0]  = 0;
4049
114k
        pcs->ppcs->nb_cdef_strengths             = 1;
4050
114k
        frm_hdr->cdef_params.cdef_uv_strength[0] = 0;
4051
114k
        return;
4052
114k
    }
4053
4054
7.04k
    const int32_t     m    = ~((1 << (6 - MI_SIZE_LOG2)) - 1);
4055
7.04k
    const MbModeInfo* mbmi = pcs->mi_grid_base[(mi_row & m) * cm->mi_stride + (mi_col & m)];
4056
4057
    // Initialise when at top left part of the superblock
4058
7.04k
    if (!(mi_row & (scs->seq_header.sb_mi_size - 1)) && !(mi_col & (scs->seq_header.sb_mi_size - 1))) { // Top left?
4059
3.41k
        ctx->cdef_transmitted[0] = ctx->cdef_transmitted[1] = ctx->cdef_transmitted[2] = ctx->cdef_transmitted[3] =
4060
3.41k
            false;
4061
3.41k
    }
4062
4063
    // Emit CDEF param at first non-skip coding block
4064
7.04k
    const int32_t mask  = 1 << (6 - MI_SIZE_LOG2);
4065
7.04k
    const int32_t index = scs->seq_header.sb_size == BLOCK_128X128 ? !!(mi_col & mask) + 2 * !!(mi_row & mask) : 0;
4066
4067
7.04k
    if (!ctx->cdef_transmitted[index] && !skip) {
4068
3.07k
        aom_write_literal(w, mbmi->cdef_strength, frm_hdr->cdef_params.cdef_bits);
4069
3.07k
        ctx->cdef_transmitted[index] = true;
4070
3.07k
    }
4071
7.04k
}
4072
4073
4.53k
void svt_av1_reset_loop_restoration(EntropyCodingContext* ctx) {
4074
18.1k
    for (int32_t p = 0; p < MAX_PLANES; ++p) {
4075
13.6k
        set_default_wiener(ctx->wiener_info + p);
4076
13.6k
        set_default_sgrproj(ctx->sgrproj_info + p);
4077
13.6k
    }
4078
4.53k
}
4079
4080
static void write_wiener_filter(int32_t wiener_win, const WienerInfo* wiener_info, WienerInfo* ref_wiener_info,
4081
0
                                AomWriter* wb) {
4082
0
    if (wiener_win == WIENER_WIN) {
4083
0
        svt_aom_write_primitive_refsubexpfin(wb,
4084
0
                                             WIENER_FILT_TAP0_MAXV - WIENER_FILT_TAP0_MINV + 1,
4085
0
                                             WIENER_FILT_TAP0_SUBEXP_K,
4086
0
                                             ref_wiener_info->vfilter[0] - WIENER_FILT_TAP0_MINV,
4087
0
                                             wiener_info->vfilter[0] - WIENER_FILT_TAP0_MINV);
4088
0
    } else {
4089
0
        assert(wiener_info->vfilter[0] == 0 && wiener_info->vfilter[WIENER_WIN - 1] == 0);
4090
0
    }
4091
0
    svt_aom_write_primitive_refsubexpfin(wb,
4092
0
                                         WIENER_FILT_TAP1_MAXV - WIENER_FILT_TAP1_MINV + 1,
4093
0
                                         WIENER_FILT_TAP1_SUBEXP_K,
4094
0
                                         ref_wiener_info->vfilter[1] - WIENER_FILT_TAP1_MINV,
4095
0
                                         wiener_info->vfilter[1] - WIENER_FILT_TAP1_MINV);
4096
0
    svt_aom_write_primitive_refsubexpfin(wb,
4097
0
                                         WIENER_FILT_TAP2_MAXV - WIENER_FILT_TAP2_MINV + 1,
4098
0
                                         WIENER_FILT_TAP2_SUBEXP_K,
4099
0
                                         ref_wiener_info->vfilter[2] - WIENER_FILT_TAP2_MINV,
4100
0
                                         wiener_info->vfilter[2] - WIENER_FILT_TAP2_MINV);
4101
0
    if (wiener_win == WIENER_WIN) {
4102
0
        svt_aom_write_primitive_refsubexpfin(wb,
4103
0
                                             WIENER_FILT_TAP0_MAXV - WIENER_FILT_TAP0_MINV + 1,
4104
0
                                             WIENER_FILT_TAP0_SUBEXP_K,
4105
0
                                             ref_wiener_info->hfilter[0] - WIENER_FILT_TAP0_MINV,
4106
0
                                             wiener_info->hfilter[0] - WIENER_FILT_TAP0_MINV);
4107
0
    } else {
4108
0
        assert(wiener_info->hfilter[0] == 0 && wiener_info->hfilter[WIENER_WIN - 1] == 0);
4109
0
    }
4110
0
    svt_aom_write_primitive_refsubexpfin(wb,
4111
0
                                         WIENER_FILT_TAP1_MAXV - WIENER_FILT_TAP1_MINV + 1,
4112
0
                                         WIENER_FILT_TAP1_SUBEXP_K,
4113
0
                                         ref_wiener_info->hfilter[1] - WIENER_FILT_TAP1_MINV,
4114
0
                                         wiener_info->hfilter[1] - WIENER_FILT_TAP1_MINV);
4115
0
    svt_aom_write_primitive_refsubexpfin(wb,
4116
0
                                         WIENER_FILT_TAP2_MAXV - WIENER_FILT_TAP2_MINV + 1,
4117
0
                                         WIENER_FILT_TAP2_SUBEXP_K,
4118
0
                                         ref_wiener_info->hfilter[2] - WIENER_FILT_TAP2_MINV,
4119
0
                                         wiener_info->hfilter[2] - WIENER_FILT_TAP2_MINV);
4120
0
    svt_memcpy(ref_wiener_info, wiener_info, sizeof(*wiener_info));
4121
0
}
4122
4123
0
static void write_sgrproj_filter(const SgrprojInfo* sgrproj_info, SgrprojInfo* ref_sgrproj_info, AomWriter* wb) {
4124
0
    aom_write_literal(wb, sgrproj_info->ep, SGRPROJ_PARAMS_BITS);
4125
0
    const SgrParamsType* params = &svt_aom_eb_sgr_params[sgrproj_info->ep];
4126
4127
0
    if (params->r[0] == 0) {
4128
0
        assert(sgrproj_info->xqd[0] == 0);
4129
0
        svt_aom_write_primitive_refsubexpfin(wb,
4130
0
                                             SGRPROJ_PRJ_MAX1 - SGRPROJ_PRJ_MIN1 + 1,
4131
0
                                             SGRPROJ_PRJ_SUBEXP_K,
4132
0
                                             (uint16_t)(ref_sgrproj_info->xqd[1] - SGRPROJ_PRJ_MIN1),
4133
0
                                             (uint16_t)(sgrproj_info->xqd[1] - SGRPROJ_PRJ_MIN1));
4134
0
    } else if (params->r[1] == 0) {
4135
0
        svt_aom_write_primitive_refsubexpfin(wb,
4136
0
                                             SGRPROJ_PRJ_MAX0 - SGRPROJ_PRJ_MIN0 + 1,
4137
0
                                             SGRPROJ_PRJ_SUBEXP_K,
4138
0
                                             (uint16_t)(ref_sgrproj_info->xqd[0] - SGRPROJ_PRJ_MIN0),
4139
0
                                             (uint16_t)(sgrproj_info->xqd[0] - SGRPROJ_PRJ_MIN0));
4140
0
    } else {
4141
0
        svt_aom_write_primitive_refsubexpfin(wb,
4142
0
                                             SGRPROJ_PRJ_MAX0 - SGRPROJ_PRJ_MIN0 + 1,
4143
0
                                             SGRPROJ_PRJ_SUBEXP_K,
4144
0
                                             (uint16_t)(ref_sgrproj_info->xqd[0] - SGRPROJ_PRJ_MIN0),
4145
0
                                             (uint16_t)(sgrproj_info->xqd[0] - SGRPROJ_PRJ_MIN0));
4146
0
        svt_aom_write_primitive_refsubexpfin(wb,
4147
0
                                             SGRPROJ_PRJ_MAX1 - SGRPROJ_PRJ_MIN1 + 1,
4148
0
                                             SGRPROJ_PRJ_SUBEXP_K,
4149
0
                                             (uint16_t)(ref_sgrproj_info->xqd[1] - SGRPROJ_PRJ_MIN1),
4150
0
                                             (uint16_t)(sgrproj_info->xqd[1] - SGRPROJ_PRJ_MIN1));
4151
0
    }
4152
4153
0
    svt_memcpy(ref_sgrproj_info, sgrproj_info, sizeof(*sgrproj_info));
4154
0
}
4155
4156
static void loop_restoration_write_sb_coeffs(PictureControlSet* pcs, FRAME_CONTEXT* frame_context,
4157
                                             EntropyCodingContext* ctx, const RestorationUnitInfo* rui,
4158
0
                                             AomWriter* const w, int32_t plane) {
4159
0
    const RestorationInfo* rsi         = pcs->rst_info + plane;
4160
0
    RestorationType        frame_rtype = rsi->frame_restoration_type;
4161
0
    if (frame_rtype == RESTORE_NONE) {
4162
0
        return;
4163
0
    }
4164
4165
0
    const int32_t   wiener_win   = (plane > 0) ? WIENER_WIN_CHROMA : WIENER_WIN;
4166
0
    WienerInfo*     wiener_info  = &ctx->wiener_info[plane];
4167
0
    SgrprojInfo*    sgrproj_info = &ctx->sgrproj_info[plane];
4168
0
    RestorationType unit_rtype   = rui->restoration_type;
4169
4170
0
    assert(unit_rtype < CDF_SIZE(RESTORE_SWITCHABLE_TYPES));
4171
4172
0
    if (frame_rtype == RESTORE_SWITCHABLE) {
4173
0
        aom_write_symbol(w,
4174
0
                         unit_rtype,
4175
0
                         /*xd->tile_ctx->*/ frame_context->switchable_restore_cdf,
4176
0
                         RESTORE_SWITCHABLE_TYPES);
4177
0
        switch (unit_rtype) {
4178
0
        case RESTORE_WIENER:
4179
0
            write_wiener_filter(wiener_win, &rui->wiener_info, wiener_info, w);
4180
            //SVT_LOG("POC:%i plane:%i v:%i %i %i  h:%i %i %i\n", piCSetPtr->picture_number, plane, rui->wiener_info.vfilter[0], rui->wiener_info.vfilter[1], rui->wiener_info.vfilter[2], rui->wiener_info.hfilter[0], rui->wiener_info.hfilter[1], rui->wiener_info.hfilter[2]);
4181
0
            break;
4182
0
        case RESTORE_SGRPROJ:
4183
0
            write_sgrproj_filter(&rui->sgrproj_info, sgrproj_info, w);
4184
            //SVT_LOG("POC:%i plane:%i ep:%i xqd_0:%i  xqd_1:%i\n", piCSetPtr->picture_number, plane, rui->sgrproj_info.ep, rui->sgrproj_info.xqd[0], rui->sgrproj_info.xqd[1]);
4185
0
            break;
4186
0
        default:
4187
0
            assert(unit_rtype == RESTORE_NONE); // SVT_LOG("POC:%i plane:%i OFF\n", piCSetPtr->picture_number, plane);
4188
0
            break;
4189
0
        }
4190
0
    } else if (frame_rtype == RESTORE_WIENER) {
4191
0
        aom_write_symbol(w,
4192
0
                         unit_rtype != RESTORE_NONE,
4193
0
                         /*xd->tile_ctx->*/ frame_context->wiener_restore_cdf,
4194
0
                         2);
4195
0
        if (unit_rtype != RESTORE_NONE) {
4196
0
            write_wiener_filter(wiener_win, &rui->wiener_info, wiener_info, w);
4197
            //SVT_LOG("POC:%i plane:%i v:%i %i %i  h:%i %i %i\n", piCSetPtr->picture_number, plane, rui->wiener_info.vfilter[0], rui->wiener_info.vfilter[1], rui->wiener_info.vfilter[2], rui->wiener_info.hfilter[0], rui->wiener_info.hfilter[1], rui->wiener_info.hfilter[2]);
4198
0
        }
4199
        //else
4200
        //SVT_LOG("POC:%i plane:%i OFF\n", piCSetPtr->picture_number, plane);
4201
0
    } else if (frame_rtype == RESTORE_SGRPROJ) {
4202
0
        aom_write_symbol(w,
4203
0
                         unit_rtype != RESTORE_NONE,
4204
0
                         /*xd->tile_ctx->*/ frame_context->sgrproj_restore_cdf,
4205
0
                         2);
4206
0
        if (unit_rtype != RESTORE_NONE) {
4207
0
            write_sgrproj_filter(&rui->sgrproj_info, sgrproj_info, w);
4208
            //SVT_LOG("POC:%i plane:%i ep:%i xqd_0:%i  xqd_1:%i\n", piCSetPtr->picture_number, plane, rui->sgrproj_info.ep, rui->sgrproj_info.xqd[0], rui->sgrproj_info.xqd[1]);
4209
0
        }
4210
        //else
4211
        //    SVT_LOG("POC:%i plane:%i OFF\n", piCSetPtr->picture_number, plane);
4212
0
    }
4213
0
}
4214
4215
static void ec_update_neighbors(PictureControlSet* pcs, EntropyCodingContext* ec_ctx, uint32_t blk_org_x,
4216
121k
                                uint32_t blk_org_y, uint16_t tile_idx, BlockSize bsize) {
4217
121k
    NeighborArrayUnit* partition_context_na        = pcs->partition_context_na[tile_idx];
4218
121k
    NeighborArrayUnit* luma_dc_sign_level_coeff_na = pcs->luma_dc_sign_level_coeff_na[tile_idx];
4219
121k
    NeighborArrayUnit* cr_dc_sign_level_coeff_na   = pcs->cr_dc_sign_level_coeff_na[tile_idx];
4220
121k
    NeighborArrayUnit* cb_dc_sign_level_coeff_na   = pcs->cb_dc_sign_level_coeff_na[tile_idx];
4221
121k
    MbModeInfo*        mbmi                        = get_mbmi(pcs, blk_org_x, blk_org_y);
4222
121k
    uint8_t            skip_coeff                  = mbmi->block_mi.skip;
4223
121k
    const int          bwidth                      = block_size_wide[bsize];
4224
121k
    const int          bheight                     = block_size_high[bsize];
4225
121k
    const bool         has_uv                      = is_chroma_reference(blk_org_y >> 2, blk_org_x >> 2, bsize, 1, 1);
4226
4227
    // Update the Leaf Depth Neighbor Array
4228
121k
    svt_aom_neighbor_array_unit_mode_write_pu(partition_context_na,
4229
121k
                                              (uint8_t*)&partition_context_lookup[bsize].above,
4230
121k
                                              blk_org_x,
4231
121k
                                              blk_org_y,
4232
121k
                                              bwidth,
4233
121k
                                              bheight,
4234
121k
                                              NEIGHBOR_ARRAY_UNIT_TOP_MASK);
4235
121k
    svt_aom_neighbor_array_unit_mode_write_pu(partition_context_na,
4236
121k
                                              (uint8_t*)&partition_context_lookup[bsize].left,
4237
121k
                                              blk_org_x,
4238
121k
                                              blk_org_y,
4239
121k
                                              bwidth,
4240
121k
                                              bheight,
4241
121k
                                              NEIGHBOR_ARRAY_UNIT_LEFT_MASK);
4242
121k
    if (skip_coeff) {
4243
115k
        uint8_t dc_sign_level_coeff = 0;
4244
4245
115k
        svt_aom_neighbor_array_unit_mode_write_pu(luma_dc_sign_level_coeff_na,
4246
115k
                                                  (uint8_t*)&dc_sign_level_coeff,
4247
115k
                                                  blk_org_x,
4248
115k
                                                  blk_org_y,
4249
115k
                                                  bwidth,
4250
115k
                                                  bheight,
4251
115k
                                                  NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
4252
4253
115k
        if (has_uv) {
4254
115k
            const BlockSize bsize_uv   = get_plane_block_size(bsize, 1, 1);
4255
115k
            const int       bwidth_uv  = block_size_wide[bsize_uv];
4256
115k
            const int       bheight_uv = block_size_high[bsize_uv];
4257
115k
            svt_aom_neighbor_array_unit_mode_write_pu(cb_dc_sign_level_coeff_na,
4258
115k
                                                      &dc_sign_level_coeff,
4259
115k
                                                      ((blk_org_x >> 3) << 3) >> 1,
4260
115k
                                                      ((blk_org_y >> 3) << 3) >> 1,
4261
115k
                                                      bwidth_uv,
4262
115k
                                                      bheight_uv,
4263
115k
                                                      NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
4264
115k
            svt_aom_neighbor_array_unit_mode_write_pu(cr_dc_sign_level_coeff_na,
4265
115k
                                                      &dc_sign_level_coeff,
4266
115k
                                                      ((blk_org_x >> 3) << 3) >> 1,
4267
115k
                                                      ((blk_org_y >> 3) << 3) >> 1,
4268
115k
                                                      bwidth_uv,
4269
115k
                                                      bheight_uv,
4270
115k
                                                      NEIGHBOR_ARRAY_UNIT_TOP_AND_LEFT_ONLY_MASK);
4271
115k
            ec_ctx->coded_area_sb_uv += bwidth_uv * bheight_uv;
4272
115k
        }
4273
115k
        ec_ctx->coded_area_sb += bwidth * bheight;
4274
115k
    }
4275
121k
}
4276
4277
362k
int svt_aom_allow_palette(int allow_screen_content_tools, BlockSize bsize) {
4278
362k
    return allow_screen_content_tools && block_size_wide[bsize] <= 64 && block_size_high[bsize] <= 64 &&
4279
0
        bsize >= BLOCK_8X8;
4280
362k
}
4281
4282
0
int svt_aom_get_palette_bsize_ctx(BlockSize bsize) {
4283
0
    return eb_num_pels_log2_lookup[bsize] - eb_num_pels_log2_lookup[BLOCK_8X8];
4284
0
}
4285
4286
void svt_av1_tokenize_color_map(FRAME_CONTEXT* frame_context, EcBlkStruct* blk_ptr, int plane, TOKENEXTRA** t,
4287
                                BlockSize bsize, TxSize tx_size, COLOR_MAP_TYPE type, int allow_update_cdf);
4288
void svt_aom_get_block_dimensions(BlockSize bsize, int plane, const MacroBlockD* xd, int* width, int* height,
4289
                                  int* rows_within_bounds, int* cols_within_bounds);
4290
int  svt_get_palette_cache_y(const MacroBlockD* const xd, uint16_t* cache);
4291
int  svt_av1_index_color_cache(const uint16_t* color_cache, int n_cache, const uint16_t* colors, int n_colors,
4292
                               uint8_t* cache_color_found, int* out_cache_colors);
4293
4294
0
int svt_aom_get_palette_mode_ctx(const MacroBlockD* xd) {
4295
0
    const MbModeInfo* const above_mi = xd->above_mbmi;
4296
0
    const MbModeInfo* const left_mi  = xd->left_mbmi;
4297
0
    int                     ctx      = 0;
4298
0
    if (above_mi) {
4299
0
        ctx += (above_mi->palette_mode_info.palette_size > 0);
4300
0
    }
4301
0
    if (left_mi) {
4302
0
        ctx += (left_mi->palette_mode_info.palette_size > 0);
4303
0
    }
4304
0
    return ctx;
4305
0
}
4306
4307
// Transmit color values with delta encoding. Write the first value as
4308
// literal, and the deltas between each value and the previous one. "min_val" is
4309
// the smallest possible value of the deltas.
4310
static AOM_INLINE void delta_encode_palette_colors(const int* colors, int num, int bit_depth, int min_val,
4311
0
                                                   AomWriter* w) {
4312
0
    if (num <= 0) {
4313
0
        return;
4314
0
    }
4315
0
    assert(colors[0] < (1 << bit_depth));
4316
0
    aom_write_literal(w, colors[0], bit_depth);
4317
0
    if (num == 1) {
4318
0
        return;
4319
0
    }
4320
0
    int max_delta = 0;
4321
0
    int deltas[PALETTE_MAX_SIZE];
4322
0
    memset(deltas, 0, sizeof(deltas));
4323
0
    for (int i = 1; i < num; ++i) {
4324
0
        assert(colors[i] < (1 << bit_depth));
4325
0
        const int delta = colors[i] - colors[i - 1];
4326
0
        deltas[i - 1]   = delta;
4327
0
        assert(delta >= min_val);
4328
0
        if (delta > max_delta) {
4329
0
            max_delta = delta;
4330
0
        }
4331
0
    }
4332
0
    const int min_bits = bit_depth - 3;
4333
0
    int       bits     = AOMMAX(av1_ceil_log2(max_delta + 1 - min_val), min_bits);
4334
0
    assert(bits <= bit_depth);
4335
0
    int range = (1 << bit_depth) - colors[0] - min_val;
4336
0
    aom_write_literal(w, bits - min_bits, 2);
4337
0
    for (int i = 0; i < num - 1; ++i) {
4338
0
        aom_write_literal(w, deltas[i] - min_val, bits);
4339
0
        range -= deltas[i];
4340
0
        bits = AOMMIN(bits, av1_ceil_log2(range));
4341
0
    }
4342
0
}
4343
4344
0
static INLINE int get_unsigned_bits(unsigned int num_values) {
4345
0
    return num_values > 0 ? get_msb(num_values) + 1 : 0;
4346
0
}
4347
4348
0
static INLINE void write_uniform(AomWriter* w, int n, int v) {
4349
0
    const int l = get_unsigned_bits(n);
4350
0
    const int m = (1 << l) - n;
4351
0
    if (l == 0) {
4352
0
        return;
4353
0
    }
4354
0
    if (v < m) {
4355
0
        aom_write_literal(w, v, l - 1);
4356
0
    } else {
4357
0
        aom_write_literal(w, m + ((v - m) >> 1), l - 1);
4358
0
        aom_write_literal(w, (v - m) & 1, 1);
4359
0
    }
4360
0
}
4361
4362
0
int svt_aom_write_uniform_cost(int n, int v) {
4363
0
    const int l = get_unsigned_bits(n);
4364
0
    const int m = (1 << l) - n;
4365
0
    if (l == 0) {
4366
0
        return 0;
4367
0
    }
4368
0
    if (v < m) {
4369
0
        return av1_cost_literal(l - 1);
4370
0
    } else {
4371
0
        return av1_cost_literal(l);
4372
0
    }
4373
0
}
4374
4375
// Transmit luma palette color values. First signal if each color in the color
4376
// cache is used. Those colors that are not in the cache are transmitted with
4377
// delta encoding.
4378
static AOM_INLINE void write_palette_colors_y(const MacroBlockD* const xd, const PaletteModeInfo* const pmi,
4379
0
                                              int bit_depth, AomWriter* w, const int palette_size) {
4380
0
    const int n = palette_size;
4381
0
    uint16_t  color_cache[2 * PALETTE_MAX_SIZE];
4382
0
    const int n_cache = svt_get_palette_cache_y(xd, color_cache);
4383
0
    int       out_cache_colors[PALETTE_MAX_SIZE];
4384
0
    uint8_t   cache_color_found[2 * PALETTE_MAX_SIZE];
4385
0
    const int n_out_cache = svt_av1_index_color_cache(
4386
0
        color_cache, n_cache, pmi->palette_colors, n, cache_color_found, out_cache_colors);
4387
0
    int n_in_cache = 0;
4388
0
    for (int i = 0; i < n_cache && n_in_cache < n; ++i) {
4389
0
        const int found = cache_color_found[i];
4390
0
        aom_write_bit(w, found);
4391
0
        n_in_cache += found;
4392
0
    }
4393
0
    assert(n_in_cache + n_out_cache == n);
4394
0
    delta_encode_palette_colors(out_cache_colors, n_out_cache, bit_depth, 1, w);
4395
0
}
4396
4397
0
static inline void pack_map_tokens(AomWriter* w, const TOKENEXTRA** tp, int n, int num) {
4398
0
    const TOKENEXTRA* p = *tp;
4399
0
    write_uniform(w, n, p->token); // The first color index.
4400
0
    ++p;
4401
0
    --num;
4402
0
    for (int i = 0; i < num; ++i) {
4403
0
        aom_write_symbol(w, p->token, p->color_map_cdf, n);
4404
0
        ++p;
4405
0
    }
4406
0
    *tp = p;
4407
0
}
4408
4409
static void write_palette_mode_info(PictureParentControlSet* ppcs, FRAME_CONTEXT* ec_ctx, MbModeInfo* mbmi,
4410
0
                                    EcBlkStruct* blk_ptr, BlockSize bsize, int mi_row, int mi_col, AomWriter* w) {
4411
0
    const uint32_t intra_luma_mode   = mbmi->block_mi.mode;
4412
0
    uint32_t       intra_chroma_mode = mbmi->block_mi.uv_mode;
4413
4414
0
    const PaletteModeInfo* const pmi       = &blk_ptr->palette_info->pmi;
4415
0
    const int                    bsize_ctx = svt_aom_get_palette_bsize_ctx(bsize);
4416
0
    assert(bsize_ctx >= 0);
4417
0
    if (intra_luma_mode == DC_PRED) {
4418
0
        const int n                  = blk_ptr->palette_size[0];
4419
0
        const int palette_y_mode_ctx = svt_aom_get_palette_mode_ctx(blk_ptr->av1xd);
4420
0
        aom_write_symbol(w, n > 0, ec_ctx->palette_y_mode_cdf[bsize_ctx][palette_y_mode_ctx], 2);
4421
0
        if (n > 0) {
4422
0
            aom_write_symbol(w, n - PALETTE_MIN_SIZE, ec_ctx->palette_y_size_cdf[bsize_ctx], PALETTE_SIZES);
4423
0
            write_palette_colors_y(blk_ptr->av1xd, pmi, ppcs->scs->static_config.encoder_bit_depth, w, n);
4424
0
        }
4425
0
    }
4426
4427
0
    const int uv_dc_pred = intra_chroma_mode == UV_DC_PRED && is_chroma_reference(mi_row, mi_col, bsize, 1, 1);
4428
0
    if (uv_dc_pred) {
4429
0
        assert(blk_ptr->palette_size[1] == 0); //remove when chroma is on
4430
0
        const int palette_uv_mode_ctx = (blk_ptr->palette_size[0] > 0);
4431
0
        aom_write_symbol(w, 0, ec_ctx->palette_uv_mode_cdf[palette_uv_mode_ctx], 2);
4432
0
    }
4433
0
}
4434
4435
0
void svt_av1_encode_dv(AomWriter* w, const Mv* mv, const Mv* ref, NmvContext* mvctx) {
4436
    // DV and ref DV should not have sub-pel.
4437
0
    assert((mv->x & 7) == 0);
4438
0
    assert((mv->y & 7) == 0);
4439
0
    assert((ref->x & 7) == 0);
4440
0
    assert((ref->y & 7) == 0);
4441
    // The y-component (row component) of the MV is coded first
4442
0
    const Mv          diff = {{mv->x - ref->x, mv->y - ref->y}};
4443
0
    const MvJointType j    = svt_av1_get_mv_joint(&diff);
4444
4445
0
    aom_write_symbol(w, j, mvctx->joints_cdf, MV_JOINTS);
4446
0
    if (mv_joint_vertical(j)) {
4447
0
        encode_mv_component(w, diff.y, &mvctx->comps[0], MV_SUBPEL_NONE);
4448
0
    }
4449
4450
0
    if (mv_joint_horizontal(j)) {
4451
0
        encode_mv_component(w, diff.x, &mvctx->comps[1], MV_SUBPEL_NONE);
4452
0
    }
4453
0
}
4454
4455
362k
int svt_aom_allow_intrabc(const FrameHeader* frm_hdr, SliceType slice_type) {
4456
363k
    return (slice_type == I_SLICE && frm_hdr->allow_screen_content_tools && frm_hdr->allow_intrabc);
4457
362k
}
4458
4459
0
static void write_intrabc_info(FRAME_CONTEXT* ec_ctx, MbModeInfo* mbmi, EcBlkStruct* blk_ptr, AomWriter* w) {
4460
0
    int use_intrabc = mbmi->block_mi.use_intrabc;
4461
0
    aom_write_symbol(w, use_intrabc, ec_ctx->intrabc_cdf, 2);
4462
0
    if (use_intrabc) {
4463
        //assert(mbmi->mode == DC_PRED);
4464
        //assert(mbmi->uv_mode == UV_DC_PRED);
4465
        //assert(mbmi->motion_mode == SIMPLE_TRANSLATION);
4466
0
        Mv dv_ref = blk_ptr->predmv[0];
4467
0
        Mv mv     = mbmi->block_mi.mv[INTRA_FRAME];
4468
0
        svt_av1_encode_dv(w, &mv, &dv_ref, &ec_ctx->ndvc);
4469
0
    }
4470
0
}
4471
4472
128k
static INLINE int block_signals_txsize(BlockSize bsize) {
4473
128k
    return bsize > BLOCK_4X4;
4474
128k
}
4475
4476
0
static INLINE int get_vartx_max_txsize(/*const MbModeInfo *xd,*/ BlockSize bsize, int plane) {
4477
    /* if (xd->lossless[xd->mi[0]->segment_id]) return TX_4X4;*/
4478
0
    const TxSize max_txsize = blocksize_to_txsize[bsize];
4479
0
    if (plane == 0) {
4480
0
        return max_txsize; // luma
4481
0
    }
4482
0
    return av1_get_adjusted_tx_size(max_txsize); // chroma
4483
0
}
4484
4485
0
static INLINE int max_block_wide(const MacroBlockD* xd, BlockSize bsize, int plane) {
4486
0
    int max_blocks_wide = block_size_wide[bsize];
4487
4488
0
    if (xd->mb_to_right_edge < 0) {
4489
0
        max_blocks_wide += gcc_right_shift(xd->mb_to_right_edge, 3 + !!plane);
4490
0
    }
4491
4492
    // Scale the width in the transform block unit.
4493
0
    return max_blocks_wide >> tx_size_wide_log2[0];
4494
0
}
4495
4496
0
static INLINE int max_block_high(const MacroBlockD* xd, BlockSize bsize, int plane) {
4497
0
    int max_blocks_high = block_size_high[bsize];
4498
4499
0
    if (xd->mb_to_bottom_edge < 0) {
4500
0
        max_blocks_high += gcc_right_shift(xd->mb_to_bottom_edge, 3 + !!plane);
4501
0
    }
4502
4503
    // Scale the height in the transform block unit.
4504
0
    return max_blocks_high >> tx_size_high_log2[0];
4505
0
}
4506
4507
static INLINE void txfm_partition_update(TXFM_CONTEXT* above_ctx, TXFM_CONTEXT* left_ctx, TxSize tx_size,
4508
0
                                         TxSize txb_size) {
4509
0
    BlockSize bsize = txsize_to_bsize[txb_size];
4510
0
    assert(bsize < BLOCK_SIZES_ALL);
4511
0
    int     bh  = mi_size_high[bsize];
4512
0
    int     bw  = mi_size_wide[bsize];
4513
0
    uint8_t txw = tx_size_wide[tx_size];
4514
0
    uint8_t txh = tx_size_high[tx_size];
4515
0
    int     i;
4516
0
    for (i = 0; i < bh; ++i) {
4517
0
        left_ctx[i] = txh;
4518
0
    }
4519
0
    for (i = 0; i < bw; ++i) {
4520
0
        above_ctx[i] = txw;
4521
0
    }
4522
0
}
4523
4524
0
static INLINE TxSize get_sqr_tx_size(int tx_dim) {
4525
0
    switch (tx_dim) {
4526
0
    case 128:
4527
0
    case 64:
4528
0
        return TX_64X64;
4529
0
        break;
4530
0
    case 32:
4531
0
        return TX_32X32;
4532
0
        break;
4533
0
    case 16:
4534
0
        return TX_16X16;
4535
0
        break;
4536
0
    case 8:
4537
0
        return TX_8X8;
4538
0
        break;
4539
0
    default:
4540
0
        return TX_4X4;
4541
0
    }
4542
0
}
4543
4544
static INLINE int txfm_partition_context(TXFM_CONTEXT* above_ctx, TXFM_CONTEXT* left_ctx, BlockSize bsize,
4545
0
                                         TxSize tx_size) {
4546
0
    const uint8_t txw      = tx_size_wide[tx_size];
4547
0
    const uint8_t txh      = tx_size_high[tx_size];
4548
0
    const int     above    = *above_ctx < txw;
4549
0
    const int     left     = *left_ctx < txh;
4550
0
    int           category = TXFM_PARTITION_CONTEXTS;
4551
4552
    // dummy return, not used by others.
4553
0
    if (tx_size == TX_4X4) {
4554
0
        return 0;
4555
0
    }
4556
4557
0
    TxSize max_tx_size = get_sqr_tx_size(AOMMAX(block_size_wide[bsize], block_size_high[bsize]));
4558
4559
0
    if (max_tx_size >= TX_8X8) {
4560
0
        category = (txsize_sqr_up_map[tx_size] != max_tx_size && max_tx_size > TX_8X8) +
4561
0
            (TX_SIZES - 1 - max_tx_size) * 2;
4562
0
    }
4563
0
    assert(category != TXFM_PARTITION_CONTEXTS);
4564
0
    return category * 3 + above + left;
4565
0
}
4566
4567
static void write_tx_size_vartx(MacroBlockD* xd, const MbModeInfo* mbmi, TxSize tx_size, int depth, int blk_row,
4568
0
                                int blk_col, FRAME_CONTEXT* ec_ctx, AomWriter* w) {
4569
0
    const int max_blocks_high = max_block_high(xd, mbmi->bsize, 0);
4570
0
    const int max_blocks_wide = max_block_wide(xd, mbmi->bsize, 0);
4571
4572
0
    if (blk_row >= max_blocks_high || blk_col >= max_blocks_wide) {
4573
0
        return;
4574
0
    }
4575
4576
0
    if (depth == MAX_VARTX_DEPTH) {
4577
0
        txfm_partition_update(xd->above_txfm_context + blk_col, xd->left_txfm_context + blk_row, tx_size, tx_size);
4578
0
        return;
4579
0
    }
4580
4581
0
    const int ctx = txfm_partition_context(
4582
0
        xd->above_txfm_context + blk_col, xd->left_txfm_context + blk_row, mbmi->bsize, tx_size);
4583
0
    const int write_txfm_partition = (tx_size == tx_depth_to_tx_size[mbmi->block_mi.tx_depth][mbmi->bsize]);
4584
4585
0
    if (write_txfm_partition) {
4586
0
        aom_write_symbol(w, 0, ec_ctx->txfm_partition_cdf[ctx], 2);
4587
4588
0
        txfm_partition_update(xd->above_txfm_context + blk_col, xd->left_txfm_context + blk_row, tx_size, tx_size);
4589
0
    } else {
4590
0
        ASSERT(tx_size < TX_SIZES_ALL);
4591
0
        const TxSize sub_txs = eb_sub_tx_size_map[tx_size];
4592
0
        const int    bsw     = eb_tx_size_wide_unit[sub_txs];
4593
0
        const int    bsh     = eb_tx_size_high_unit[sub_txs];
4594
4595
0
        aom_write_symbol(w, 1, ec_ctx->txfm_partition_cdf[ctx], 2);
4596
4597
0
        if (sub_txs == TX_4X4) {
4598
0
            txfm_partition_update(xd->above_txfm_context + blk_col, xd->left_txfm_context + blk_row, sub_txs, tx_size);
4599
0
            return;
4600
0
        }
4601
4602
0
        assert(bsw > 0 && bsh > 0);
4603
0
        for (int row = 0; row < eb_tx_size_high_unit[tx_size]; row += bsh) {
4604
0
            for (int col = 0; col < eb_tx_size_wide_unit[tx_size]; col += bsw) {
4605
0
                int offsetr = blk_row + row;
4606
0
                int offsetc = blk_col + col;
4607
0
                write_tx_size_vartx(xd, mbmi, sub_txs, depth + 1, offsetr, offsetc, ec_ctx, w);
4608
0
            }
4609
0
        }
4610
0
    }
4611
0
}
4612
4613
242k
static INLINE void set_txfm_ctx(TXFM_CONTEXT* txfm_ctx, uint8_t txs, int len) {
4614
242k
    int i;
4615
805k
    for (i = 0; i < len; ++i) {
4616
563k
        txfm_ctx[i] = txs;
4617
563k
    }
4618
242k
}
4619
4620
121k
static INLINE void set_txfm_ctxs(TxSize tx_size, int n8_w, int n8_h, int skip, const MacroBlockD* xd) {
4621
121k
    uint8_t bw = tx_size_wide[tx_size];
4622
121k
    uint8_t bh = tx_size_high[tx_size];
4623
4624
121k
    if (skip) {
4625
0
        bw = n8_w * MI_SIZE;
4626
0
        bh = n8_h * MI_SIZE;
4627
0
    }
4628
4629
121k
    set_txfm_ctx(xd->above_txfm_context, bw, n8_w);
4630
121k
    set_txfm_ctx(xd->left_txfm_context, bh, n8_h);
4631
121k
}
4632
4633
7.04k
static INLINE int tx_size_to_depth(TxSize tx_size, BlockSize bsize) {
4634
7.04k
    TxSize ctx_size = blocksize_to_txsize[bsize];
4635
7.04k
    int    depth    = 0;
4636
7.04k
    while (tx_size != ctx_size) {
4637
0
        depth++;
4638
0
        ctx_size = eb_sub_tx_size_map[ctx_size];
4639
0
        assert(depth <= MAX_TX_DEPTH);
4640
0
    }
4641
7.04k
    return depth;
4642
7.04k
}
4643
4644
// Returns a context number for the given MB prediction signal
4645
// The mode info data structure has a one element border above and to the
4646
// left of the entries corresponding to real blocks.
4647
// The prediction flags in these dummy entries are initialized to 0.
4648
7.04k
static INLINE int get_tx_size_context(const MacroBlockD* xd) {
4649
7.04k
    const MbModeInfo*       mbmi        = xd->mi[0];
4650
7.04k
    const MbModeInfo* const above_mbmi  = xd->above_mbmi;
4651
7.04k
    const MbModeInfo* const left_mbmi   = xd->left_mbmi;
4652
7.04k
    const TxSize            max_tx_size = blocksize_to_txsize[mbmi->bsize];
4653
7.04k
    const int               max_tx_wide = tx_size_wide[max_tx_size];
4654
7.04k
    const int               max_tx_high = tx_size_high[max_tx_size];
4655
7.04k
    const int               has_above   = xd->up_available;
4656
7.04k
    const int               has_left    = xd->left_available;
4657
4658
7.04k
    int above = xd->above_txfm_context[0] >= max_tx_wide;
4659
7.04k
    int left  = xd->left_txfm_context[0] >= max_tx_high;
4660
4661
7.04k
    if (has_above) {
4662
2.41k
        if (is_inter_block(&above_mbmi->block_mi)) {
4663
0
            above = block_size_wide[above_mbmi->bsize] >= max_tx_wide;
4664
0
        }
4665
2.41k
    }
4666
4667
7.04k
    if (has_left) {
4668
2.21k
        if (is_inter_block(&left_mbmi->block_mi)) {
4669
0
            left = block_size_high[left_mbmi->bsize] >= max_tx_high;
4670
0
        }
4671
2.21k
    }
4672
4673
7.04k
    if (has_above && has_left) {
4674
140
        return (above + left);
4675
6.90k
    } else if (has_above) {
4676
2.27k
        return above;
4677
4.63k
    } else if (has_left) {
4678
2.07k
        return left;
4679
2.55k
    } else {
4680
2.55k
        return 0;
4681
2.55k
    }
4682
7.04k
}
4683
4684
7.04k
static void write_selected_tx_size(const MacroBlockD* xd, FRAME_CONTEXT* ec_ctx, AomWriter* w, TxSize tx_size) {
4685
7.04k
    const MbModeInfo* const mbmi  = xd->mi[0];
4686
7.04k
    const BlockSize         bsize = mbmi->bsize;
4687
4688
7.04k
    if (block_signals_txsize(bsize)) {
4689
7.04k
        const int tx_size_ctx = get_tx_size_context(xd);
4690
7.04k
        assert(bsize < BLOCK_SIZES_ALL);
4691
7.04k
        const int     depth       = tx_size_to_depth(tx_size, bsize);
4692
7.04k
        const int     max_depths  = bsize_to_max_depth(bsize);
4693
7.04k
        const int32_t tx_size_cat = bsize_to_tx_size_cat(bsize);
4694
4695
7.04k
        assert(depth >= 0 && depth <= max_depths);
4696
7.04k
        assert(!is_inter_block(&mbmi->block_mi));
4697
7.04k
        assert(IMPLIES(is_rect_tx(tx_size), is_rect_tx_allowed(/*xd,*/ mbmi)));
4698
4699
7.04k
        aom_write_symbol(w, depth, ec_ctx->tx_size_cdf[tx_size_cat][tx_size_ctx], max_depths + 1);
4700
7.04k
    }
4701
7.04k
}
4702
4703
static EbErrorType av1_code_tx_size(PictureControlSet* pcs, int segment_id, FRAME_CONTEXT* ec_ctx, AomWriter* w,
4704
                                    MacroBlockD* xd, const MbModeInfo* mbmi, TxSize tx_size, TxMode tx_mode,
4705
121k
                                    BlockSize bsize, uint8_t skip) {
4706
121k
    EbErrorType return_error = EB_ErrorNone;
4707
121k
    int         is_inter_tx  = is_inter_block(&mbmi->block_mi);
4708
    //int skip = mbmi->skip;
4709
    //int segment_id = 0;// mbmi->segment_id;
4710
121k
    if (tx_mode == TX_MODE_SELECT && block_signals_txsize(bsize) && !(is_inter_tx && skip) &&
4711
121k
        !svt_av1_is_lossless_segment(pcs, segment_id)) {
4712
7.04k
        if (is_inter_tx) { // This implies skip flag is 0.
4713
0
            const TxSize max_tx_size = get_vartx_max_txsize(/*xd,*/ bsize, 0);
4714
0
            const int    txbh        = eb_tx_size_high_unit[max_tx_size];
4715
0
            const int    txbw        = eb_tx_size_wide_unit[max_tx_size];
4716
0
            const int    width       = block_size_wide[bsize] >> tx_size_wide_log2[0];
4717
0
            const int    height      = block_size_high[bsize] >> tx_size_high_log2[0];
4718
0
            int          idx, idy;
4719
0
            for (idy = 0; idy < height; idy += txbh) {
4720
0
                for (idx = 0; idx < width; idx += txbw) {
4721
0
                    write_tx_size_vartx(xd, mbmi, max_tx_size, 0, idy, idx, ec_ctx, w);
4722
0
                }
4723
0
            }
4724
7.04k
        } else {
4725
7.04k
            write_selected_tx_size(xd, ec_ctx, w, tx_size);
4726
7.04k
            set_txfm_ctxs(tx_size, xd->n8_w, xd->n8_h, 0, xd);
4727
7.04k
        }
4728
114k
    } else {
4729
114k
        set_txfm_ctxs(tx_size, xd->n8_w, xd->n8_h, skip && is_inter_tx, xd);
4730
114k
    }
4731
4732
121k
    return return_error;
4733
121k
}
4734
4735
void set_mi_row_col(PictureControlSet* pcs, MacroBlockD* xd, TileInfo* tile, int mi_row, int bh, int mi_col, int bw,
4736
121k
                    uint32_t mi_stride, int mi_rows, int mi_cols) {
4737
121k
    xd->mb_to_top_edge    = -((mi_row * MI_SIZE) * 8);
4738
121k
    xd->mb_to_bottom_edge = ((mi_rows - bh - mi_row) * MI_SIZE) * 8;
4739
121k
    xd->mb_to_left_edge   = -((mi_col * MI_SIZE) * 8);
4740
121k
    xd->mb_to_right_edge  = ((mi_cols - bw - mi_col) * MI_SIZE) * 8;
4741
4742
121k
    xd->mi_stride = mi_stride;
4743
4744
    // Are edges available for intra prediction?
4745
121k
    xd->up_available     = (mi_row > tile->mi_row_start);
4746
121k
    xd->left_available   = (mi_col > tile->mi_col_start);
4747
121k
    const int32_t offset = mi_row * mi_stride + mi_col;
4748
121k
    xd->mi               = pcs->mi_grid_base + offset;
4749
4750
121k
    if (xd->up_available) {
4751
101k
        xd->above_mbmi = xd->mi[-xd->mi_stride];
4752
101k
    } else {
4753
19.9k
        xd->above_mbmi = NULL;
4754
19.9k
    }
4755
4756
121k
    if (xd->left_available) {
4757
101k
        xd->left_mbmi = xd->mi[-1];
4758
101k
    } else {
4759
19.5k
        xd->left_mbmi = NULL;
4760
19.5k
    }
4761
4762
121k
    xd->n8_h        = bh;
4763
121k
    xd->n8_w        = bw;
4764
121k
    xd->is_sec_rect = 0;
4765
121k
    if (xd->n8_w < xd->n8_h) {
4766
        // Only mark is_sec_rect as 1 for the last block.
4767
        // For PARTITION_VERT_4, it would be (0, 0, 0, 1);
4768
        // For other partitions, it would be (0, 1).
4769
0
        if (!((mi_col + xd->n8_w) & (xd->n8_h - 1))) {
4770
0
            xd->is_sec_rect = 1;
4771
0
        }
4772
0
    }
4773
4774
121k
    if (xd->n8_w > xd->n8_h) {
4775
0
        if (mi_row & (xd->n8_w - 1)) {
4776
0
            xd->is_sec_rect = 1;
4777
0
        }
4778
0
    }
4779
121k
}
4780
4781
static INLINE int svt_aom_get_segment_id(Av1Common* cm, const uint8_t* segment_ids, BlockSize bsize, int mi_row,
4782
0
                                         int mi_col) {
4783
0
    const int mi_offset = mi_row * cm->mi_cols + mi_col;
4784
0
    const int bw        = mi_size_wide[bsize];
4785
0
    const int bh        = mi_size_high[bsize];
4786
0
    const int xmis      = AOMMIN(cm->mi_cols - mi_col, bw);
4787
0
    const int ymis      = AOMMIN(cm->mi_rows - mi_row, bh);
4788
0
    int       x, y, segment_id = MAX_SEGMENTS;
4789
4790
0
    for (y = 0; y < ymis; ++y) {
4791
0
        for (x = 0; x < xmis; ++x) {
4792
0
            segment_id = AOMMIN(segment_id, segment_ids[mi_offset + y * cm->mi_cols + x]);
4793
0
        }
4794
0
    }
4795
4796
0
    assert(segment_id >= 0 && segment_id < MAX_SEGMENTS);
4797
0
    return segment_id;
4798
0
}
4799
4800
static void code_tx_size(PictureControlSet* pcs, uint32_t blk_org_x, uint32_t blk_org_y, EcBlkStruct* blk_ptr,
4801
                         const BlockSize bsize, NeighborArrayUnit* txfm_context_array, FRAME_CONTEXT* ec_ctx,
4802
121k
                         AomWriter* w, uint8_t skip) {
4803
121k
    TxMode       tx_mode = pcs->ppcs->frm_hdr.tx_mode;
4804
121k
    Av1Common*   cm      = pcs->ppcs->av1_cm;
4805
121k
    MacroBlockD* xd      = blk_ptr->av1xd;
4806
    // xd fields (mi, up_available, left_available, etc.) are already set by
4807
    // the caller (write_modes_b) via set_mi_row_col — no need to redo.
4808
4809
121k
    const MbModeInfo* const mbmi              = xd->mi[0];
4810
121k
    xd->above_txfm_context                    = (TXFM_CONTEXT*)svt_aom_na_top_ptr_pu(txfm_context_array, blk_org_x);
4811
121k
    xd->left_txfm_context                     = (TXFM_CONTEXT*)svt_aom_na_left_ptr_pu(txfm_context_array, blk_org_y);
4812
121k
    const TxSize             tx_size          = tx_depth_to_tx_size[mbmi->block_mi.tx_depth][bsize];
4813
121k
    FrameHeader*             frm_hdr          = &pcs->ppcs->frm_hdr;
4814
121k
    SegmentationNeighborMap* segmentation_map = pcs->segmentation_neighbor_map;
4815
121k
    int32_t                  mi_row           = blk_org_y >> MI_SIZE_LOG2;
4816
121k
    int32_t                  mi_col           = blk_org_x >> MI_SIZE_LOG2;
4817
121k
    av1_code_tx_size(pcs,
4818
121k
                     frm_hdr->segmentation_params.segmentation_enabled
4819
121k
                         ? svt_aom_get_segment_id(cm, segmentation_map->data, BLOCK_4X4, mi_row, mi_col)
4820
121k
                         : 0,
4821
121k
                     ec_ctx,
4822
121k
                     w,
4823
121k
                     xd,
4824
121k
                     mbmi,
4825
121k
                     tx_size,
4826
121k
                     tx_mode,
4827
121k
                     bsize,
4828
121k
                     skip);
4829
121k
}
4830
4831
int svt_av1_get_spatial_seg_prediction(PictureControlSet* pcs, MacroBlockD* xd, uint32_t blk_org_x, uint32_t blk_org_y,
4832
0
                                       int* cdf_index) {
4833
0
    int prev_ul = -1; // top left segment_id
4834
0
    int prev_l  = -1; // left segment_id
4835
0
    int prev_u  = -1; // top segment_id
4836
4837
0
    uint32_t                 mi_col           = blk_org_x >> MI_SIZE_LOG2;
4838
0
    uint32_t                 mi_row           = blk_org_y >> MI_SIZE_LOG2;
4839
0
    bool                     left_available   = xd->left_available;
4840
0
    bool                     up_available     = xd->up_available;
4841
0
    Av1Common*               cm               = pcs->ppcs->av1_cm;
4842
0
    SegmentationNeighborMap* segmentation_map = pcs->segmentation_neighbor_map;
4843
4844
    //    SVT_LOG("Left available = %d, Up Available = %d ", left_available, up_available);
4845
4846
0
    if ((up_available) && (left_available)) {
4847
0
        prev_ul = svt_aom_get_segment_id(cm, segmentation_map->data, BLOCK_4X4, mi_row - 1, mi_col - 1);
4848
0
    }
4849
4850
0
    if (up_available) {
4851
0
        prev_u = svt_aom_get_segment_id(cm, segmentation_map->data, BLOCK_4X4, mi_row - 1, mi_col - 0);
4852
0
    }
4853
4854
0
    if (left_available) {
4855
0
        prev_l = svt_aom_get_segment_id(cm, segmentation_map->data, BLOCK_4X4, mi_row - 0, mi_col - 1);
4856
0
    }
4857
4858
    // Pick CDF index based on number of matching/out-of-bounds segment IDs.
4859
0
    if (prev_ul < 0 || prev_u < 0 || prev_l < 0) { /* Edge case */
4860
0
        *cdf_index = 0;
4861
0
    } else if ((prev_ul == prev_u) && (prev_ul == prev_l)) {
4862
0
        *cdf_index = 2;
4863
0
    } else if ((prev_ul == prev_u) || (prev_ul == prev_l) || (prev_u == prev_l)) {
4864
0
        *cdf_index = 1;
4865
0
    } else {
4866
0
        *cdf_index = 0;
4867
0
    }
4868
4869
    // If 2 or more are identical returns that as predictor, otherwise prev_l.
4870
0
    if (prev_u == -1) { // edge case
4871
0
        return prev_l == -1 ? 0 : prev_l;
4872
0
    }
4873
0
    if (prev_l == -1) { // edge case
4874
0
        return prev_u;
4875
0
    }
4876
0
    return (prev_ul == prev_u) ? prev_u : prev_l;
4877
0
}
4878
4879
0
int svt_av1_neg_interleave(int x, int ref, int max) {
4880
0
    assert(x < max);
4881
0
    const int diff = x - ref;
4882
0
    if (!ref) {
4883
0
        return x;
4884
0
    }
4885
0
    if (ref >= (max - 1)) {
4886
0
        return -x + max - 1;
4887
0
    }
4888
0
    if (2 * ref < max) {
4889
0
        if (abs(diff) <= ref) {
4890
0
            return diff > 0 ? (diff << 1) - 1 : ((-diff) << 1);
4891
0
        }
4892
0
        return x;
4893
0
    } else {
4894
0
        if (abs(diff) < (max - ref)) {
4895
0
            return diff > 0 ? (diff << 1) - 1 : ((-diff) << 1);
4896
0
        }
4897
0
        return (max - x) - 1;
4898
0
    }
4899
0
}
4900
4901
void svt_av1_update_segmentation_map(PictureControlSet* pcs, BlockSize bsize, uint32_t blk_org_x, uint32_t blk_org_y,
4902
0
                                     uint8_t segment_id) {
4903
0
    Av1Common* cm          = pcs->ppcs->av1_cm;
4904
0
    uint8_t*   segment_ids = pcs->segmentation_neighbor_map->data;
4905
0
    uint32_t   mi_col      = blk_org_x >> MI_SIZE_LOG2;
4906
0
    uint32_t   mi_row      = blk_org_y >> MI_SIZE_LOG2;
4907
0
    const int  mi_offset   = mi_row * cm->mi_cols + mi_col;
4908
0
    const int  bw          = mi_size_wide[bsize];
4909
0
    const int  bh          = mi_size_high[bsize];
4910
0
    const int  xmis        = AOMMIN((int)(cm->mi_cols - mi_col), bw);
4911
0
    const int  ymis        = AOMMIN((int)(cm->mi_rows - mi_row), bh);
4912
0
    int        x, y;
4913
4914
0
    for (y = 0; y < ymis; ++y) {
4915
0
        for (x = 0; x < xmis; ++x) {
4916
0
            segment_ids[mi_offset + y * cm->mi_cols + x] = segment_id;
4917
0
        }
4918
0
    }
4919
0
}
4920
4921
void write_segment_id(PictureControlSet* pcs, FRAME_CONTEXT* frame_context, AomWriter* ecWriter, BlockSize bsize,
4922
0
                      uint32_t blk_org_x, uint32_t blk_org_y, EcBlkStruct* blk_ptr, bool skip_coeff) {
4923
0
    SegmentationParams* segmentation_params = &pcs->ppcs->frm_hdr.segmentation_params;
4924
0
    if (!segmentation_params->segmentation_enabled) {
4925
0
        return;
4926
0
    }
4927
0
    MbModeInfo* mbmi = get_mbmi(pcs, blk_org_x, blk_org_y);
4928
0
    int         cdf_num;
4929
0
    const int   spatial_pred = svt_av1_get_spatial_seg_prediction(pcs, blk_ptr->av1xd, blk_org_x, blk_org_y, &cdf_num);
4930
0
    if (skip_coeff) {
4931
0
        svt_av1_update_segmentation_map(pcs, bsize, blk_org_x, blk_org_y, spatial_pred);
4932
0
        mbmi->segment_id = spatial_pred;
4933
0
        return;
4934
0
    }
4935
0
    const int coded_id = svt_av1_neg_interleave(
4936
0
        mbmi->segment_id, spatial_pred, segmentation_params->last_active_seg_id + 1);
4937
0
    struct segmentation_probs* segp     = &frame_context->seg;
4938
0
    AomCdfProb*                pred_cdf = segp->spatial_pred_seg_cdf[cdf_num];
4939
0
    aom_write_symbol(ecWriter, coded_id, pred_cdf, MAX_SEGMENTS);
4940
0
    svt_av1_update_segmentation_map(pcs, bsize, blk_org_x, blk_org_y, mbmi->segment_id);
4941
0
}
4942
4943
static void write_inter_segment_id(PictureControlSet* pcs, FRAME_CONTEXT* frame_context, AomWriter* ecWriter,
4944
                                   const BlockSize bsize, uint32_t blk_org_x, uint32_t blk_org_y, EcBlkStruct* blk_ptr,
4945
0
                                   bool skip, int pre_skip) {
4946
0
    SegmentationParams* segmentation_params = &pcs->ppcs->frm_hdr.segmentation_params;
4947
0
    if (!segmentation_params->segmentation_enabled) {
4948
0
        return;
4949
0
    }
4950
4951
0
    if (segmentation_params->segmentation_update_map) {
4952
0
        if (pre_skip) {
4953
0
            if (!segmentation_params->seg_id_pre_skip) {
4954
0
                return;
4955
0
            }
4956
0
        } else {
4957
0
            if (segmentation_params->seg_id_pre_skip) {
4958
0
                return;
4959
0
            }
4960
0
            if (skip) {
4961
0
                write_segment_id(pcs, frame_context, ecWriter, bsize, blk_org_x, blk_org_y, blk_ptr, 1);
4962
0
                if (segmentation_params->segmentation_temporal_update) {
4963
0
                    SVT_ERROR("Temporal update is not supported yet! \n");
4964
0
                    assert(0);
4965
                    //                    blk_ptr->seg_id_predicted = 0;
4966
0
                }
4967
0
                return;
4968
0
            }
4969
0
        }
4970
4971
0
        if (segmentation_params->segmentation_temporal_update) {
4972
0
            SVT_ERROR("Temporal update is not supported yet! \n");
4973
0
            assert(0);
4974
4975
0
        } else {
4976
0
            write_segment_id(pcs, frame_context, ecWriter, bsize, blk_org_x, blk_org_y, blk_ptr, 0);
4977
0
        }
4978
0
    }
4979
0
}
4980
4981
0
int svt_aom_is_interintra_allowed(const MbModeInfo* mbmi) {
4982
0
    return svt_aom_is_interintra_allowed_bsize(mbmi->bsize) &&
4983
0
        svt_aom_is_interintra_allowed_mode(mbmi->block_mi.mode) &&
4984
0
        svt_aom_is_interintra_allowed_ref(mbmi->block_mi.ref_frame);
4985
0
}
4986
4987
int svt_aom_is_interintra_wedge_used(BlockSize bsize);
4988
4989
static EbErrorType write_modes_b(PictureControlSet* pcs, EntropyCodingContext* ec_ctx, EntropyCoder* ec,
4990
                                 SuperBlock* sb_ptr, EcBlkStruct* blk_ptr, uint16_t tile_idx,
4991
121k
                                 EbPictureBufferDesc* coeff_ptr, const int mi_row, const int mi_col) {
4992
121k
    EbErrorType         return_error  = EB_ErrorNone;
4993
121k
    FRAME_CONTEXT*      frame_context = ec->fc;
4994
121k
    AomWriter*          ec_writer     = &ec->ec_writer;
4995
121k
    SequenceControlSet* scs           = pcs->scs;
4996
121k
    FrameHeader*        frm_hdr       = &pcs->ppcs->frm_hdr;
4997
4998
121k
    NeighborArrayUnit* luma_dc_sign_level_coeff_na = pcs->luma_dc_sign_level_coeff_na[tile_idx];
4999
121k
    NeighborArrayUnit* cr_dc_sign_level_coeff_na   = pcs->cr_dc_sign_level_coeff_na[tile_idx];
5000
121k
    NeighborArrayUnit* cb_dc_sign_level_coeff_na   = pcs->cb_dc_sign_level_coeff_na[tile_idx];
5001
121k
    NeighborArrayUnit* txfm_context_array          = pcs->txfm_context_array[tile_idx];
5002
121k
    const uint32_t     blk_org_x                   = mi_col << MI_SIZE_LOG2;
5003
121k
    const uint32_t     blk_org_y                   = mi_row << MI_SIZE_LOG2;
5004
121k
    MbModeInfo*        mbmi                        = get_mbmi(pcs, blk_org_x, blk_org_y);
5005
121k
    const BlockSize    bsize                       = mbmi->bsize;
5006
121k
    const int          bwidth                      = block_size_wide[bsize];
5007
121k
    const int          bheight                     = block_size_high[bsize];
5008
121k
    bool               skip_coeff                  = mbmi->block_mi.skip;
5009
121k
    const bool         has_uv                      = is_chroma_reference(blk_org_y >> 2, blk_org_x >> 2, bsize, 1, 1);
5010
121k
    ec_ctx->mbmi                                   = mbmi;
5011
5012
121k
    const uint8_t skip_mode = mbmi->block_mi.skip_mode;
5013
5014
121k
    assert(bsize < BLOCK_SIZES_ALL);
5015
121k
    int mi_stride                     = pcs->ppcs->av1_cm->mi_stride;
5016
121k
    blk_ptr->av1xd->tile.mi_col_start = sb_ptr->tile_info.mi_col_start;
5017
121k
    blk_ptr->av1xd->tile.mi_col_end   = sb_ptr->tile_info.mi_col_end;
5018
121k
    blk_ptr->av1xd->tile.mi_row_start = sb_ptr->tile_info.mi_row_start;
5019
121k
    blk_ptr->av1xd->tile.mi_row_end   = sb_ptr->tile_info.mi_row_end;
5020
121k
    blk_ptr->av1xd->tile_ctx          = frame_context;
5021
5022
121k
    const int32_t bw = mi_size_wide[bsize];
5023
121k
    const int32_t bh = mi_size_high[bsize];
5024
121k
    set_mi_row_col(pcs,
5025
121k
                   blk_ptr->av1xd,
5026
121k
                   &blk_ptr->av1xd->tile,
5027
121k
                   mi_row,
5028
121k
                   bh,
5029
121k
                   mi_col,
5030
121k
                   bw,
5031
121k
                   mi_stride,
5032
121k
                   pcs->ppcs->av1_cm->mi_rows,
5033
121k
                   pcs->ppcs->av1_cm->mi_cols);
5034
121k
    if (pcs->slice_type == I_SLICE) {
5035
        //const int32_t skip = write_skip(cm, xd, mbmi->segment_id, mi, w)
5036
5037
121k
        if (pcs->ppcs->frm_hdr.segmentation_params.segmentation_enabled &&
5038
0
            pcs->ppcs->frm_hdr.segmentation_params.seg_id_pre_skip) {
5039
0
            write_segment_id(pcs, frame_context, ec_writer, bsize, blk_org_x, blk_org_y, blk_ptr, skip_coeff);
5040
0
        }
5041
5042
121k
        encode_skip_coeff_av1(blk_ptr, frame_context, ec_writer, skip_coeff);
5043
5044
121k
        if (pcs->ppcs->frm_hdr.segmentation_params.segmentation_enabled &&
5045
0
            !pcs->ppcs->frm_hdr.segmentation_params.seg_id_pre_skip) {
5046
0
            write_segment_id(pcs, frame_context, ec_writer, bsize, blk_org_x, blk_org_y, blk_ptr, skip_coeff);
5047
0
        }
5048
5049
121k
        write_cdef(scs, pcs, ec_ctx, ec_writer, skip_coeff, blk_org_x >> MI_SIZE_LOG2, blk_org_y >> MI_SIZE_LOG2);
5050
121k
        if (pcs->ppcs->frm_hdr.delta_q_params.delta_q_present) {
5051
0
            int32_t current_q_index        = blk_ptr->qindex;
5052
0
            int32_t super_block_upper_left = (((blk_org_y >> 2) & (scs->seq_header.sb_mi_size - 1)) == 0) &&
5053
0
                (((blk_org_x >> 2) & (scs->seq_header.sb_mi_size - 1)) == 0);
5054
0
            if ((bsize != scs->seq_header.sb_size || skip_coeff == 0) && super_block_upper_left) {
5055
0
                assert(current_q_index > 0);
5056
0
                int32_t reduced_delta_qindex = (current_q_index - pcs->ppcs->prev_qindex[tile_idx]) /
5057
0
                    frm_hdr->delta_q_params.delta_q_res;
5058
5059
                //write_delta_qindex(xd, reduced_delta_qindex, w);
5060
0
                av1_write_delta_q_index(frame_context, reduced_delta_qindex, ec_writer);
5061
                /*if (pcs->picture_number == 0){
5062
                SVT_LOG("%d\t%d\t%d\t%d\n",
5063
                blk_org_x,
5064
                blk_org_y,
5065
                current_q_index,
5066
                pcs->ppcs->prev_qindex);
5067
                }*/
5068
0
                pcs->ppcs->prev_qindex[tile_idx] = current_q_index;
5069
0
            }
5070
0
        }
5071
5072
121k
        {
5073
121k
            const uint32_t intra_luma_mode   = mbmi->block_mi.mode;
5074
121k
            uint32_t       intra_chroma_mode = mbmi->block_mi.uv_mode;
5075
121k
            if (svt_aom_allow_intrabc(&pcs->ppcs->frm_hdr, pcs->ppcs->slice_type)) {
5076
0
                write_intrabc_info(frame_context, mbmi, blk_ptr, ec_writer);
5077
0
            }
5078
121k
            if (mbmi->block_mi.use_intrabc == 0) {
5079
121k
                encode_intra_luma_mode_kf_av1(frame_context, ec_writer, mbmi, blk_ptr, bsize, intra_luma_mode);
5080
121k
            }
5081
121k
            if (mbmi->block_mi.use_intrabc == 0) {
5082
121k
                if (has_uv) {
5083
121k
                    encode_intra_chroma_mode_av1(frame_context,
5084
121k
                                                 ec_writer,
5085
121k
                                                 mbmi,
5086
121k
                                                 bsize,
5087
121k
                                                 intra_luma_mode,
5088
121k
                                                 intra_chroma_mode,
5089
121k
                                                 bwidth <= 32 && bheight <= 32);
5090
121k
                }
5091
121k
            }
5092
121k
            if (mbmi->block_mi.use_intrabc == 0 && svt_aom_allow_palette(frm_hdr->allow_screen_content_tools, bsize)) {
5093
0
                write_palette_mode_info(
5094
5095
0
                    pcs->ppcs,
5096
0
                    frame_context,
5097
0
                    mbmi,
5098
0
                    blk_ptr,
5099
0
                    bsize,
5100
0
                    blk_org_y >> MI_SIZE_LOG2,
5101
0
                    blk_org_x >> MI_SIZE_LOG2,
5102
0
                    ec_writer);
5103
0
            }
5104
121k
            if (mbmi->block_mi.use_intrabc == 0 &&
5105
121k
                svt_aom_filter_intra_allowed(
5106
121k
                    scs->seq_header.filter_intra_level, bsize, blk_ptr->palette_size[0], intra_luma_mode)) {
5107
0
                aom_write_symbol(ec_writer,
5108
0
                                 mbmi->block_mi.filter_intra_mode != FILTER_INTRA_MODES,
5109
0
                                 frame_context->filter_intra_cdfs[bsize],
5110
0
                                 2);
5111
0
                if (mbmi->block_mi.filter_intra_mode != FILTER_INTRA_MODES) {
5112
0
                    aom_write_symbol(ec_writer,
5113
0
                                     mbmi->block_mi.filter_intra_mode,
5114
0
                                     frame_context->filter_intra_mode_cdf,
5115
0
                                     FILTER_INTRA_MODES);
5116
0
                }
5117
0
            }
5118
121k
            if (mbmi->block_mi.use_intrabc == 0) {
5119
121k
                assert(blk_ptr->palette_size[1] == 0);
5120
121k
                TOKENEXTRA* tok = ec_ctx->tok;
5121
363k
                for (int plane = 0; plane < 2; ++plane) {
5122
242k
                    const uint8_t palette_size_plane = blk_ptr->palette_size[plane];
5123
242k
                    if (palette_size_plane > 0) {
5124
0
                        const TxSize tx_size = tx_depth_to_tx_size[mbmi->block_mi.tx_depth][mbmi->bsize];
5125
0
                        svt_av1_tokenize_color_map(
5126
0
                            frame_context,
5127
0
                            blk_ptr,
5128
0
                            plane,
5129
0
                            &tok,
5130
0
                            bsize,
5131
0
                            tx_size,
5132
0
                            PALETTE_MAP,
5133
0
                            0); //NO CDF update in entropy, the update will take place in arithmetic encode
5134
0
                        assert(mbmi->block_mi.use_intrabc == 0);
5135
0
                        assert(svt_aom_allow_palette(pcs->ppcs->frm_hdr.allow_screen_content_tools, bsize));
5136
0
                        int rows, cols;
5137
0
                        svt_aom_get_block_dimensions(bsize, plane, blk_ptr->av1xd, NULL, NULL, &rows, &cols);
5138
0
                        pack_map_tokens(ec_writer, (const TOKENEXTRA**)(&ec_ctx->tok), palette_size_plane, rows * cols);
5139
                        // advance the pointer
5140
0
                        ec_ctx->tok = tok;
5141
0
                    }
5142
242k
                }
5143
121k
            }
5144
121k
            if (frm_hdr->tx_mode == TX_MODE_SELECT) {
5145
121k
                code_tx_size(pcs,
5146
121k
                             blk_org_x,
5147
121k
                             blk_org_y,
5148
121k
                             blk_ptr,
5149
121k
                             bsize,
5150
121k
                             txfm_context_array,
5151
121k
                             frame_context,
5152
121k
                             ec_writer,
5153
121k
                             skip_coeff);
5154
121k
            }
5155
121k
            if (!skip_coeff) {
5156
5.40k
                av1_encode_coeff_1d(pcs,
5157
5.40k
                                    ec_ctx,
5158
5.40k
                                    frame_context,
5159
5.40k
                                    ec_writer,
5160
5.40k
                                    blk_ptr,
5161
5.40k
                                    blk_org_x,
5162
5.40k
                                    blk_org_y,
5163
5.40k
                                    intra_luma_mode,
5164
5.40k
                                    bsize,
5165
5.40k
                                    coeff_ptr,
5166
5.40k
                                    luma_dc_sign_level_coeff_na,
5167
5.40k
                                    cr_dc_sign_level_coeff_na,
5168
5.40k
                                    cb_dc_sign_level_coeff_na);
5169
5.40k
            }
5170
121k
        }
5171
121k
    } else {
5172
0
        write_inter_segment_id(pcs, frame_context, ec_writer, bsize, blk_org_x, blk_org_y, blk_ptr, 0, 1);
5173
0
        if (frm_hdr->skip_mode_params.skip_mode_flag && is_comp_ref_allowed(bsize)) {
5174
0
            encode_skip_mode_av1(blk_ptr, frame_context, ec_writer, skip_mode);
5175
0
        }
5176
0
        if (!frm_hdr->skip_mode_params.skip_mode_flag && skip_mode) {
5177
0
            SVT_ERROR("SKIP not supported\n");
5178
0
        }
5179
0
        if (!skip_mode) {
5180
            // const int32_t skip = write_skip(cm, xd, mbmi->segment_id, mi, w);
5181
0
            encode_skip_coeff_av1(blk_ptr, frame_context, ec_writer, skip_coeff);
5182
0
        }
5183
5184
0
        write_inter_segment_id(pcs, frame_context, ec_writer, bsize, blk_org_x, blk_org_y, blk_ptr, skip_coeff, 0);
5185
0
        write_cdef(scs,
5186
0
                   pcs, /*cm,*/
5187
0
                   ec_ctx,
5188
0
                   ec_writer,
5189
0
                   skip_mode ? 1 : skip_coeff,
5190
0
                   blk_org_x >> MI_SIZE_LOG2,
5191
0
                   blk_org_y >> MI_SIZE_LOG2);
5192
0
        if (pcs->ppcs->frm_hdr.delta_q_params.delta_q_present) {
5193
0
            int32_t current_q_index        = blk_ptr->qindex;
5194
0
            int32_t super_block_upper_left = (((blk_org_y >> 2) & (scs->seq_header.sb_mi_size - 1)) == 0) &&
5195
0
                (((blk_org_x >> 2) & (scs->seq_header.sb_mi_size - 1)) == 0);
5196
0
            if ((bsize != scs->seq_header.sb_size || skip_coeff == 0) && super_block_upper_left) {
5197
0
                assert(current_q_index > 0);
5198
0
                int32_t reduced_delta_qindex = (current_q_index - pcs->ppcs->prev_qindex[tile_idx]) /
5199
0
                    frm_hdr->delta_q_params.delta_q_res;
5200
0
                av1_write_delta_q_index(frame_context, reduced_delta_qindex, ec_writer);
5201
0
                pcs->ppcs->prev_qindex[tile_idx] = current_q_index;
5202
0
            }
5203
0
        }
5204
0
        if (frm_hdr->tx_mode == TX_MODE_SELECT) {
5205
0
            if (skip_mode) {
5206
0
                code_tx_size(
5207
0
                    pcs, blk_org_x, blk_org_y, blk_ptr, bsize, txfm_context_array, frame_context, ec_writer, skip_mode);
5208
0
            }
5209
0
        }
5210
0
        if (!skip_mode) {
5211
0
            write_is_inter(blk_ptr, frame_context, ec_writer, (int32_t)is_inter_mode(ec_ctx->mbmi->block_mi.mode));
5212
0
            if (is_intra_mode(ec_ctx->mbmi->block_mi.mode)) {
5213
0
                uint32_t intra_luma_mode = mbmi->block_mi.mode;
5214
5215
0
                uint32_t intra_chroma_mode = mbmi->block_mi.uv_mode;
5216
5217
0
                encode_intra_luma_mode_nonkey_av1(frame_context, ec_writer, mbmi, bsize, intra_luma_mode);
5218
0
                if (has_uv) {
5219
0
                    encode_intra_chroma_mode_av1(frame_context,
5220
0
                                                 ec_writer,
5221
0
                                                 mbmi,
5222
0
                                                 bsize,
5223
0
                                                 intra_luma_mode,
5224
0
                                                 intra_chroma_mode,
5225
0
                                                 bwidth <= 32 && bheight <= 32);
5226
0
                }
5227
0
                if (svt_aom_allow_palette(pcs->ppcs->frm_hdr.allow_screen_content_tools, bsize)) {
5228
0
                    write_palette_mode_info(pcs->ppcs,
5229
0
                                            frame_context,
5230
0
                                            mbmi,
5231
0
                                            blk_ptr,
5232
0
                                            bsize,
5233
0
                                            blk_org_y >> MI_SIZE_LOG2,
5234
0
                                            blk_org_x >> MI_SIZE_LOG2,
5235
0
                                            ec_writer);
5236
0
                }
5237
0
                if (svt_aom_filter_intra_allowed(
5238
0
                        scs->seq_header.filter_intra_level, bsize, blk_ptr->palette_size[0], intra_luma_mode)) {
5239
0
                    aom_write_symbol(ec_writer,
5240
0
                                     mbmi->block_mi.filter_intra_mode != FILTER_INTRA_MODES,
5241
0
                                     frame_context->filter_intra_cdfs[bsize],
5242
0
                                     2);
5243
0
                    if (mbmi->block_mi.filter_intra_mode != FILTER_INTRA_MODES) {
5244
0
                        aom_write_symbol(ec_writer,
5245
0
                                         mbmi->block_mi.filter_intra_mode,
5246
0
                                         frame_context->filter_intra_mode_cdf,
5247
0
                                         FILTER_INTRA_MODES);
5248
0
                    }
5249
0
                }
5250
5251
0
            } else {
5252
0
                svt_aom_collect_neighbors_ref_counts_new(blk_ptr->av1xd);
5253
5254
0
                write_ref_frames(pcs->ppcs, blk_ptr->av1xd, ec_writer);
5255
5256
0
                MvReferenceFrame* rf          = mbmi->block_mi.ref_frame;
5257
0
                int16_t           mode_ctx    = svt_aom_mode_context_analyzer(blk_ptr->inter_mode_ctx, rf);
5258
0
                PredictionMode    inter_mode  = mbmi->block_mi.mode;
5259
0
                const int32_t     is_compound = is_inter_compound_mode(inter_mode);
5260
5261
                // If segment skip is not enabled code the mode.
5262
0
                if (is_inter_compound_mode(inter_mode)) {
5263
0
                    write_inter_compound_mode(frame_context, ec_writer, inter_mode, mode_ctx);
5264
0
                } else if (is_inter_singleref_mode(inter_mode)) {
5265
0
                    write_inter_mode(frame_context, ec_writer, inter_mode, mode_ctx, blk_org_x, blk_org_y);
5266
0
                }
5267
5268
0
                if (inter_mode == NEWMV || inter_mode == NEW_NEWMV || have_nearmv_in_inter_mode(inter_mode)) {
5269
0
                    write_drl_idx(frame_context, ec_writer, mbmi, blk_ptr);
5270
0
                }
5271
5272
0
                if (inter_mode == NEWMV || inter_mode == NEW_NEWMV) {
5273
0
                    Mv ref_mv;
5274
5275
0
                    for (uint8_t ref = 0; ref < 1 + is_compound; ++ref) {
5276
0
                        NmvContext* nmvc = &frame_context->nmvc;
5277
0
                        ref_mv           = blk_ptr->predmv[ref];
5278
5279
0
                        Mv mv = mbmi->block_mi.mv[ref];
5280
5281
0
                        svt_av1_encode_mv(pcs->ppcs, ec_writer, &mv, &ref_mv, nmvc, frm_hdr->allow_high_precision_mv);
5282
0
                    }
5283
0
                } else if (inter_mode == NEAREST_NEWMV || inter_mode == NEAR_NEWMV) {
5284
0
                    NmvContext* nmvc   = &frame_context->nmvc;
5285
0
                    Mv          ref_mv = blk_ptr->predmv[1];
5286
5287
0
                    Mv mv = mbmi->block_mi.mv[1];
5288
5289
0
                    svt_av1_encode_mv(pcs->ppcs, ec_writer, &mv, &ref_mv, nmvc, frm_hdr->allow_high_precision_mv);
5290
0
                } else if (inter_mode == NEW_NEARESTMV || inter_mode == NEW_NEARMV) {
5291
0
                    NmvContext* nmvc   = &frame_context->nmvc;
5292
0
                    Mv          ref_mv = blk_ptr->predmv[0];
5293
5294
0
                    Mv mv = mbmi->block_mi.mv[0];
5295
5296
0
                    svt_av1_encode_mv(pcs->ppcs, ec_writer, &mv, &ref_mv, nmvc, frm_hdr->allow_high_precision_mv);
5297
0
                }
5298
0
                if (scs->seq_header.enable_interintra_compound && svt_aom_is_interintra_allowed(mbmi)) {
5299
0
                    if (mbmi->block_mi.is_interintra_used) {
5300
0
                        rf[1]                       = INTRA_FRAME;
5301
0
                        mbmi->block_mi.ref_frame[1] = INTRA_FRAME;
5302
0
                    }
5303
5304
0
                    const int interintra  = mbmi->block_mi.is_interintra_used;
5305
0
                    const int bsize_group = eb_size_group_lookup[bsize];
5306
0
                    aom_write_symbol(
5307
0
                        ec_writer, mbmi->block_mi.is_interintra_used, frame_context->interintra_cdf[bsize_group], 2);
5308
0
                    if (interintra) {
5309
0
                        aom_write_symbol(ec_writer,
5310
0
                                         mbmi->block_mi.interintra_mode,
5311
0
                                         frame_context->interintra_mode_cdf[bsize_group],
5312
0
                                         INTERINTRA_MODES);
5313
0
                        if (svt_aom_is_interintra_wedge_used(bsize)) {
5314
0
                            aom_write_symbol(ec_writer,
5315
0
                                             mbmi->block_mi.use_wedge_interintra,
5316
0
                                             frame_context->wedge_interintra_cdf[bsize],
5317
0
                                             2);
5318
0
                            if (mbmi->block_mi.use_wedge_interintra) {
5319
0
                                aom_write_symbol(ec_writer,
5320
0
                                                 mbmi->block_mi.interintra_wedge_index,
5321
0
                                                 frame_context->wedge_idx_cdf[bsize],
5322
0
                                                 16);
5323
0
                            }
5324
0
                        }
5325
0
                    }
5326
0
                }
5327
5328
0
                if (frm_hdr->is_motion_mode_switchable && rf[1] != INTRA_FRAME) {
5329
0
                    write_motion_mode(
5330
0
                        frame_context, ec_writer, bsize, mbmi, mbmi->block_mi.motion_mode, rf[0], rf[1], blk_ptr, pcs);
5331
0
                }
5332
                // First write idx to indicate current compound inter prediction mode group
5333
                // Group A (0): dist_wtd_comp, compound_average
5334
                // Group b (1): interintra, compound_diffwtd, wedge
5335
0
                if (has_second_ref(&mbmi->block_mi)) {
5336
0
                    const int masked_compound_used = is_any_masked_compound_used(bsize) &&
5337
0
                        scs->seq_header.enable_masked_compound;
5338
5339
0
                    if (masked_compound_used) {
5340
0
                        const int ctx_comp_group_idx = svt_aom_get_comp_group_idx_context_enc(blk_ptr->av1xd);
5341
0
                        aom_write_symbol(ec_writer,
5342
0
                                         mbmi->block_mi.comp_group_idx,
5343
0
                                         frame_context->comp_group_idx_cdf[ctx_comp_group_idx],
5344
0
                                         2);
5345
0
                    } else {
5346
0
                        assert(mbmi->block_mi.comp_group_idx == 0);
5347
0
                    }
5348
5349
0
                    if (mbmi->block_mi.comp_group_idx == 0) {
5350
0
                        assert(IMPLIES(mbmi->block_mi.compound_idx,
5351
0
                                       mbmi->block_mi.interinter_comp.type == COMPOUND_AVERAGE));
5352
5353
0
                        if (scs->seq_header.order_hint_info.enable_jnt_comp) {
5354
0
                            const int comp_index_ctx = svt_aom_get_comp_index_context_enc(
5355
0
                                pcs->ppcs,
5356
0
                                pcs->ppcs->cur_order_hint, // cur_frame_index,
5357
0
                                pcs->ppcs->ref_order_hint[rf[0] - 1], // bck_frame_index,
5358
0
                                pcs->ppcs->ref_order_hint[rf[1] - 1], // fwd_frame_index,
5359
0
                                blk_ptr->av1xd);
5360
0
                            aom_write_symbol(ec_writer,
5361
0
                                             mbmi->block_mi.compound_idx,
5362
0
                                             frame_context->compound_index_cdf[comp_index_ctx],
5363
0
                                             2);
5364
0
                        } else {
5365
0
                            assert(mbmi->block_mi.compound_idx == 1);
5366
0
                        }
5367
0
                    } else {
5368
0
                        assert(pcs->ppcs->frm_hdr.reference_mode != SINGLE_REFERENCE &&
5369
0
                               is_inter_compound_mode(mbmi->block_mi.mode) &&
5370
0
                               mbmi->block_mi.motion_mode == SIMPLE_TRANSLATION);
5371
0
                        assert(masked_compound_used);
5372
                        // compound_diffwtd, wedge
5373
0
                        assert(mbmi->block_mi.interinter_comp.type == COMPOUND_WEDGE ||
5374
0
                               mbmi->block_mi.interinter_comp.type == COMPOUND_DIFFWTD);
5375
5376
0
                        if (is_interinter_compound_used(COMPOUND_WEDGE, bsize)) {
5377
0
                            aom_write_symbol(ec_writer,
5378
0
                                             mbmi->block_mi.interinter_comp.type - COMPOUND_WEDGE,
5379
0
                                             frame_context->compound_type_cdf[bsize],
5380
0
                                             MASKED_COMPOUND_TYPES);
5381
0
                        }
5382
5383
0
                        if (mbmi->block_mi.interinter_comp.type == COMPOUND_WEDGE) {
5384
0
                            assert(is_interinter_compound_used(COMPOUND_WEDGE, bsize));
5385
0
                            aom_write_symbol(ec_writer,
5386
0
                                             mbmi->block_mi.interinter_comp.wedge_index,
5387
0
                                             frame_context->wedge_idx_cdf[bsize],
5388
0
                                             16);
5389
0
                            aom_write_bit(ec_writer, mbmi->block_mi.interinter_comp.wedge_sign);
5390
0
                        } else {
5391
0
                            assert(mbmi->block_mi.interinter_comp.type == COMPOUND_DIFFWTD);
5392
0
                            aom_write_literal(
5393
0
                                ec_writer, mbmi->block_mi.interinter_comp.mask_type, MAX_DIFFWTD_MASK_BITS);
5394
0
                        }
5395
0
                    }
5396
0
                }
5397
0
                write_mb_interp_filter(bsize, rf[0], rf[1], pcs->ppcs, ec_writer, mbmi, blk_ptr, ec);
5398
0
            }
5399
0
            {
5400
0
                assert(blk_ptr->palette_size[1] == 0);
5401
0
                TOKENEXTRA* tok = ec_ctx->tok;
5402
0
                for (int plane = 0; plane < 2; ++plane) {
5403
0
                    const uint8_t palette_size_plane = blk_ptr->palette_size[plane];
5404
0
                    if (palette_size_plane > 0) {
5405
0
                        const TxSize tx_size = tx_depth_to_tx_size[mbmi->block_mi.tx_depth][mbmi->bsize];
5406
0
                        svt_av1_tokenize_color_map(
5407
0
                            frame_context,
5408
0
                            blk_ptr,
5409
0
                            plane,
5410
0
                            &tok,
5411
0
                            bsize,
5412
0
                            tx_size,
5413
0
                            PALETTE_MAP,
5414
0
                            0); //NO CDF update in entropy, the update will take place in arithmetic encode
5415
0
                        assert(mbmi->block_mi.use_intrabc == 0);
5416
0
                        assert(svt_aom_allow_palette(pcs->ppcs->frm_hdr.allow_screen_content_tools, bsize));
5417
0
                        int rows, cols;
5418
0
                        svt_aom_get_block_dimensions(bsize, plane, blk_ptr->av1xd, NULL, NULL, &rows, &cols);
5419
0
                        pack_map_tokens(ec_writer, (const TOKENEXTRA**)(&ec_ctx->tok), palette_size_plane, rows * cols);
5420
                        // advance the pointer
5421
0
                        ec_ctx->tok = tok;
5422
0
                    }
5423
0
                }
5424
0
            }
5425
5426
0
            if (frm_hdr->tx_mode == TX_MODE_SELECT) {
5427
0
                code_tx_size(pcs,
5428
0
                             blk_org_x,
5429
0
                             blk_org_y,
5430
0
                             blk_ptr,
5431
0
                             bsize,
5432
0
                             txfm_context_array,
5433
0
                             frame_context,
5434
0
                             ec_writer,
5435
0
                             skip_coeff);
5436
0
            }
5437
0
            if (!skip_coeff) {
5438
0
                uint32_t intra_luma_mode = DC_PRED;
5439
0
                if (is_intra_mode(ec_ctx->mbmi->block_mi.mode)) {
5440
0
                    intra_luma_mode = mbmi->block_mi.mode;
5441
0
                }
5442
5443
0
                {
5444
0
                    av1_encode_coeff_1d(pcs,
5445
0
                                        ec_ctx,
5446
0
                                        frame_context,
5447
0
                                        ec_writer,
5448
0
                                        blk_ptr,
5449
0
                                        blk_org_x,
5450
0
                                        blk_org_y,
5451
0
                                        intra_luma_mode,
5452
0
                                        bsize,
5453
0
                                        coeff_ptr,
5454
0
                                        luma_dc_sign_level_coeff_na,
5455
0
                                        cr_dc_sign_level_coeff_na,
5456
0
                                        cb_dc_sign_level_coeff_na);
5457
0
                }
5458
0
            }
5459
0
        }
5460
0
    }
5461
121k
#if OPT_STATS_MUTEX
5462
121k
    ec_ctx->tot_qindex += (uint64_t)blk_ptr->qindex * bwidth * bheight;
5463
121k
    ec_ctx->valid_area += bwidth * bheight;
5464
#else
5465
    svt_block_on_mutex(pcs->entropy_coding_pic_mutex);
5466
    pcs->ppcs->tot_qindex += blk_ptr->qindex * bwidth * bheight;
5467
    pcs->ppcs->valid_qindex_area += bwidth * bheight;
5468
    svt_release_mutex(pcs->entropy_coding_pic_mutex);
5469
#endif
5470
    // Update the neighbors
5471
121k
    ec_update_neighbors(pcs, ec_ctx, blk_org_x, blk_org_y, tile_idx, bsize);
5472
5473
121k
    if (svt_av1_allow_palette(pcs->ppcs->palette_level, bsize)) {
5474
        // free ENCDEC palette info buffer
5475
0
        assert(blk_ptr->palette_info->color_idx_map != NULL && "free palette:Null");
5476
0
        EB_FREE(blk_ptr->palette_info->color_idx_map);
5477
0
        blk_ptr->palette_info->color_idx_map = NULL;
5478
0
        EB_FREE(blk_ptr->palette_info);
5479
0
    }
5480
5481
121k
    return return_error;
5482
121k
}
5483
5484
/**********************************************
5485
 * Write sb
5486
 **********************************************/
5487
void svt_aom_write_modes_sb(EntropyCodingContext* ec_ctx, SuperBlock* sb_ptr, PictureControlSet* pcs, uint16_t tile_idx,
5488
                            EntropyCoder* ec, EbPictureBufferDesc* coeff_ptr, PARTITION_TREE* ptree, int mi_row,
5489
165k
                            int mi_col) {
5490
165k
    if (mi_row >= pcs->ppcs->av1_cm->mi_rows || mi_col >= pcs->ppcs->av1_cm->mi_cols) {
5491
0
        return;
5492
0
    }
5493
165k
    FRAME_CONTEXT*     frame_context        = ec->fc;
5494
165k
    AomWriter*         ec_writer            = &ec->ec_writer;
5495
165k
    NeighborArrayUnit* partition_context_na = pcs->partition_context_na[tile_idx];
5496
5497
165k
    const BlockSize bsize = ptree->bsize;
5498
165k
    assert(bsize < BLOCK_SIZES_ALL);
5499
165k
    const int           hbs          = mi_size_wide[bsize] >> 1;
5500
165k
    const int           quarter_step = mi_size_wide[bsize] >> 2;
5501
165k
    const PartitionType partition    = ptree->partition;
5502
165k
    Av1Common*          cm           = pcs->ppcs->av1_cm;
5503
5504
165k
    if (bsize >= BLOCK_8X8) {
5505
661k
        for (int32_t plane = 0; plane < 3; ++plane) {
5506
496k
            int32_t rcol0, rcol1, rrow0, rrow1, tile_tl_idx;
5507
496k
            if (svt_av1_loop_restoration_corners_in_sb(cm,
5508
496k
                                                       &pcs->scs->seq_header,
5509
496k
                                                       plane,
5510
496k
                                                       mi_row,
5511
496k
                                                       mi_col,
5512
496k
                                                       bsize,
5513
496k
                                                       &rcol0,
5514
496k
                                                       &rcol1,
5515
496k
                                                       &rrow0,
5516
496k
                                                       &rrow1,
5517
496k
                                                       &tile_tl_idx)) {
5518
0
                const int32_t rstride = pcs->rst_info[plane].horz_units_per_tile;
5519
0
                for (int32_t rrow = rrow0; rrow < rrow1; ++rrow) {
5520
0
                    for (int32_t rcol = rcol0; rcol < rcol1; ++rcol) {
5521
0
                        const int32_t              runit_idx = tile_tl_idx + rcol + rrow * rstride;
5522
0
                        const RestorationUnitInfo* rui       = &pcs->rst_info[plane].unit_info[runit_idx];
5523
0
                        loop_restoration_write_sb_coeffs(pcs, frame_context, ec_ctx, rui, ec_writer, plane);
5524
0
                    }
5525
0
                }
5526
0
            }
5527
496k
        }
5528
5529
165k
        encode_partition_av1(pcs,
5530
165k
                             frame_context,
5531
165k
                             ec_writer,
5532
165k
                             bsize,
5533
165k
                             partition,
5534
165k
                             mi_col << MI_SIZE_LOG2,
5535
165k
                             mi_row << MI_SIZE_LOG2,
5536
165k
                             partition_context_na);
5537
165k
    }
5538
5539
165k
    assert(IMPLIES(bsize == BLOCK_4X4, partition == PARTITION_NONE));
5540
165k
    assert(IMPLIES(partition != PARTITION_SPLIT, (mi_row + hbs < cm->mi_rows) || (mi_col + hbs < cm->mi_cols)));
5541
165k
    switch (partition) {
5542
121k
    case PARTITION_NONE:
5543
121k
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[0], tile_idx, coeff_ptr, mi_row, mi_col);
5544
121k
        break;
5545
0
    case PARTITION_HORZ:
5546
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[0], tile_idx, coeff_ptr, mi_row, mi_col);
5547
0
        if (mi_row + hbs < cm->mi_rows) {
5548
0
            write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[1], tile_idx, coeff_ptr, mi_row + hbs, mi_col);
5549
0
        }
5550
0
        break;
5551
0
    case PARTITION_VERT:
5552
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[0], tile_idx, coeff_ptr, mi_row, mi_col);
5553
0
        if (mi_col + hbs < cm->mi_cols) {
5554
0
            write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[1], tile_idx, coeff_ptr, mi_row, mi_col + hbs);
5555
0
        }
5556
0
        break;
5557
44.2k
    case PARTITION_SPLIT:
5558
221k
        for (int i = 0; i < SUB_PARTITIONS_SPLIT; ++i) {
5559
177k
            const int x_idx = (i & 1) * hbs;
5560
177k
            const int y_idx = (i >> 1) * hbs;
5561
177k
            if (mi_row + y_idx >= cm->mi_rows || mi_col + x_idx >= cm->mi_cols) {
5562
17.3k
                continue;
5563
17.3k
            }
5564
159k
            svt_aom_write_modes_sb(
5565
159k
                ec_ctx, sb_ptr, pcs, tile_idx, ec, coeff_ptr, ptree->sub_tree[i], mi_row + y_idx, mi_col + x_idx);
5566
159k
        }
5567
44.2k
        break;
5568
0
    case PARTITION_HORZ_A:
5569
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[0], tile_idx, coeff_ptr, mi_row, mi_col);
5570
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[1], tile_idx, coeff_ptr, mi_row, mi_col + hbs);
5571
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[2], tile_idx, coeff_ptr, mi_row + hbs, mi_col);
5572
0
        break;
5573
0
    case PARTITION_HORZ_B:
5574
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[0], tile_idx, coeff_ptr, mi_row, mi_col);
5575
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[1], tile_idx, coeff_ptr, mi_row + hbs, mi_col);
5576
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[2], tile_idx, coeff_ptr, mi_row + hbs, mi_col + hbs);
5577
0
        break;
5578
0
    case PARTITION_VERT_A:
5579
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[0], tile_idx, coeff_ptr, mi_row, mi_col);
5580
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[1], tile_idx, coeff_ptr, mi_row + hbs, mi_col);
5581
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[2], tile_idx, coeff_ptr, mi_row, mi_col + hbs);
5582
0
        break;
5583
0
    case PARTITION_VERT_B:
5584
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[0], tile_idx, coeff_ptr, mi_row, mi_col);
5585
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[1], tile_idx, coeff_ptr, mi_row, mi_col + hbs);
5586
0
        write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[2], tile_idx, coeff_ptr, mi_row + hbs, mi_col + hbs);
5587
0
        break;
5588
0
    case PARTITION_HORZ_4:
5589
0
        for (int i = 0; i < SUB_PARTITIONS_PART4; ++i) {
5590
0
            int this_mi_row = mi_row + i * quarter_step;
5591
0
            if (i > 0 && this_mi_row >= cm->mi_rows) {
5592
                // Only the last block is able to be outside the picture boundary. If one of the first
5593
                // 3 blocks is outside the boundary, H4 is not a valid partition (see AV1 spec 5.11.4)
5594
0
                assert(i == 3);
5595
0
                break;
5596
0
            }
5597
0
            write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[i], tile_idx, coeff_ptr, this_mi_row, mi_col);
5598
0
        }
5599
0
        break;
5600
0
    case PARTITION_VERT_4:
5601
0
        for (int i = 0; i < SUB_PARTITIONS_PART4; ++i) {
5602
0
            int this_mi_col = mi_col + i * quarter_step;
5603
0
            if (i > 0 && this_mi_col >= cm->mi_cols) {
5604
                // Only the last block is able to be outside the picture boundary. If one of the first
5605
                // 3 blocks is outside the boundary, H4 is not a valid partition (see AV1 spec 5.11.4)
5606
0
                assert(i == 3);
5607
0
                break;
5608
0
            }
5609
0
            write_modes_b(pcs, ec_ctx, ec, sb_ptr, ptree->blk_data[i], tile_idx, coeff_ptr, mi_row, this_mi_col);
5610
0
        }
5611
0
        break;
5612
0
    default:
5613
        assert(0);
5614
165k
    }
5615
165k
}