/src/ffmpeg/libavcodec/rv60dec.c
Line | Count | Source |
1 | | /* |
2 | | * RV60 decoder |
3 | | * Copyright (c) 2007 Mike Melanson, Konstantin Shishkov |
4 | | * Copyright (C) 2023 Peter Ross |
5 | | * |
6 | | * This file is part of FFmpeg. |
7 | | * |
8 | | * FFmpeg is free software; you can redistribute it and/or |
9 | | * modify it under the terms of the GNU Lesser General Public |
10 | | * License as published by the Free Software Foundation; either |
11 | | * version 2.1 of the License, or (at your option) any later version. |
12 | | * |
13 | | * FFmpeg is distributed in the hope that it will be useful, |
14 | | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
15 | | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
16 | | * Lesser General Public License for more details. |
17 | | * |
18 | | * You should have received a copy of the GNU Lesser General Public |
19 | | * License along with FFmpeg; if not, write to the Free Software |
20 | | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
21 | | */ |
22 | | |
23 | | #include "avcodec.h" |
24 | | #include "codec_internal.h" |
25 | | #include "decode.h" |
26 | | #include "get_bits.h" |
27 | | #include "golomb.h" |
28 | | #include "libavutil/mem.h" |
29 | | #include "rv60data.h" |
30 | | #include "rv60dsp.h" |
31 | | #include "rv60vlcs.h" |
32 | | #include "threadprogress.h" |
33 | | #include "unary.h" |
34 | | #include "videodsp.h" |
35 | | |
36 | | #include "libavutil/attributes.h" |
37 | | |
/* Maps the 2-bit frame type code read by read_frame_header() to an
 * AV_PICTURE_TYPE_* value. Code 3 maps to AV_PICTURE_TYPE_NONE, which the
 * header parser rejects as invalid data. */
static const int8_t frame_types[4] = {AV_PICTURE_TYPE_I, AV_PICTURE_TYPE_P, AV_PICTURE_TYPE_B, AV_PICTURE_TYPE_NONE};
39 | | |
/* Coding-unit type, stored per prediction unit in PUInfo.cu_type.
 * pu_is_intra() tests for CU_INTRA. */
enum CUType {
    CU_INTRA = 0,
    CU_INTER_MV,
    CU_SKIP,
    CU_INTER
};
46 | | |
/* Prediction-unit partitioning type, stored in PUInfo.pu_type.
 * NOTE(review): the names suggest full / halved / quartered / asymmetric
 * splits -- confirm against the partition handling code. */
enum PUType {
    PU_FULL = 0,
    PU_N2HOR,
    PU_N2VER,
    PU_QUARTERS,
    PU_N4HOR,
    PU_N34HOR,
    PU_N4VER,
    PU_N34VER
};
57 | | |
/* How the intra prediction mode of a block is signalled. reconstruct_intra()
 * turns these into the numeric mode consumed by pred_angle(). */
enum IntraMode {
    INTRAMODE_INDEX = 0,  /* parameter indexes the candidate mode list */
    INTRAMODE_DC64,       /* resolved to mode 1 (DC prediction) */
    INTRAMODE_PLANE64,    /* resolved to mode 0 (plane prediction) */
    INTRAMODE_MODE        /* parameter is an explicit mode, bumped past the candidates */
};
64 | | |
/* Reference selection attached to a motion vector (MVInfo.mvref).
 * MVREF_NONE marks an entry without usable motion data; add_if_valid()
 * ignores such entries. MVREF_SKIP0..MVREF_SKIP3 correspond to skip
 * candidate indices 0..3 (see get_skip_mv_index()). */
enum MVRefEnum {
    MVREF_NONE = 0,
    MVREF_REF0,
    MVREF_REF1,
    MVREF_BREF,
    MVREF_REF0ANDBREF,
    MVREF_SKIP0,
    MVREF_SKIP1,
    MVREF_SKIP2,
    MVREF_SKIP3
};
76 | | |
/* Skip candidate index (0..3) -> MVREF_SKIPn; the inverse of get_skip_mv_index(). */
static const uint8_t skip_mv_ref[4] = {MVREF_SKIP0, MVREF_SKIP1, MVREF_SKIP2, MVREF_SKIP3};
78 | | |
/* Transform size selector.
 * NOTE(review): presumably chosen per coding unit -- verify at the use sites. */
enum {
    TRANSFORM_NONE = 0,
    TRANSFORM_16X16,
    TRANSFORM_8X8,
    TRANSFORM_4X4
};
85 | | |
/* Coded-block-pattern VLC tables, filled once by rv60_init_static_data().
 * cbp16_vlc[i][0][j] points at the same table as cbp8_vlc[i][j]. */
static const VLCElem * cbp8_vlc[7][4];
static const VLCElem * cbp16_vlc[7][4][4];
88 | | |
/* One set of coefficient VLC tables as built by build_coeff_vlc():
 * two tables each for l0 (864 symbols), l12 and l3 (108 symbols each),
 * plus a single escape table (32 symbols). */
typedef struct {
    const VLCElem * l0[2];
    const VLCElem * l12[2];
    const VLCElem * l3[2];
    const VLCElem * esc;
} CoeffVLCs;
95 | | |
/* Coefficient VLC sets, filled once by rv60_init_static_data(). */
static CoeffVLCs intra_coeff_vlc[5];
static CoeffVLCs inter_coeff_vlc[7];

/* Largest symbol count handed to gen_vlc(); sizes its codeword scratch array. */
#define MAX_VLC_SIZE 864
/* Backing storage for every static VLC table (see VLC_INIT_STATE use). */
static VLCElem table_data[129148];
101 | | |
102 | | /* 32-bit version of rv34_gen_vlc */ |
103 | | static const VLCElem * gen_vlc(const uint8_t * bits, int size, VLCInitState * state) |
104 | 196 | { |
105 | 196 | int counts[17] = {0}; |
106 | 196 | uint32_t codes[18]; |
107 | 196 | uint32_t cw[MAX_VLC_SIZE]; |
108 | | |
109 | 33.6k | for (int i = 0; i < size; i++) |
110 | 33.4k | counts[bits[i]]++; |
111 | | |
112 | 196 | codes[0] = counts[0] = 0; |
113 | 3.52k | for (int i = 0; i < 17; i++) |
114 | 3.33k | codes[i+1] = (codes[i] + counts[i]) << 1; |
115 | | |
116 | 33.6k | for (int i = 0; i < size; i++) |
117 | 33.4k | cw[i] = codes[bits[i]]++; |
118 | | |
119 | 196 | return ff_vlc_init_tables(state, 9, size, |
120 | 196 | bits, 1, 1, |
121 | 196 | cw, 4, 4, 0); |
122 | 196 | } |
123 | | |
124 | | static void build_coeff_vlc(const CoeffLens * lens, CoeffVLCs * vlc, int count, VLCInitState * state) |
125 | 2 | { |
126 | 14 | for (int i = 0; i < count; i++) { |
127 | 36 | for (int j = 0; j < 2; j++) { |
128 | 24 | vlc[i].l0[j] = gen_vlc(lens[i].l0[j], 864, state); |
129 | 24 | vlc[i].l12[j] = gen_vlc(lens[i].l12[j], 108, state); |
130 | 24 | vlc[i].l3[j] = gen_vlc(lens[i].l3[j], 108, state); |
131 | 24 | } |
132 | 12 | vlc[i].esc = gen_vlc(lens[i].esc, 32, state); |
133 | 12 | } |
134 | 2 | } |
135 | | |
136 | | static av_cold void rv60_init_static_data(void) |
137 | 1 | { |
138 | 1 | VLCInitState state = VLC_INIT_STATE(table_data); |
139 | | |
140 | 8 | for (int i = 0; i < 7; i++) |
141 | 35 | for (int j = 0; j < 4; j++) |
142 | 28 | cbp16_vlc[i][0][j] = cbp8_vlc[i][j] = gen_vlc(rv60_cbp8_lens[i][j], 64, &state); |
143 | | |
144 | 8 | for (int i = 0; i < 7; i++) |
145 | 28 | for (int j = 0; j < 3; j++) |
146 | 105 | for (int k = 0; k < 4; k++) |
147 | 84 | cbp16_vlc[i][j + 1][k] = gen_vlc(rv60_cbp16_lens[i][j][k], 64, &state); |
148 | | |
149 | 1 | build_coeff_vlc(rv60_intra_lens, intra_coeff_vlc, 5, &state); |
150 | 1 | build_coeff_vlc(rv60_inter_lens, inter_coeff_vlc, 7, &state); |
151 | 1 | } |
152 | | |
/* Per-slice bookkeeping. The slice array holds cu_height entries
 * (see update_dimensions_clear_info()). */
typedef struct {
    int sign;              /* direction of this slice's size delta (read_slice_sizes()) */
    int size;              /* slice size decoded by read_slice_sizes() */
    const uint8_t * data;  /* NOTE(review): presumably the slice payload -- confirm where it is set */
    int data_size;
} Slice;
159 | | |
/* Scratch state for decoding.
 * NOTE(review): the name suggests one instance per worker -- confirm at the
 * use sites. */
typedef struct {
    int cu_split_pos;
    uint8_t cu_split[1+4+16+64];  /* 85 entries; presumably one per quadtree node -- TODO confirm */

    uint8_t coded_blk[64];

    uint8_t avg_buffer[64*64 + 32*32*2];  /* room for one 64x64 and two 32x32 byte planes */
    uint8_t * avg_data[3];
    int avg_linesize[3];
} ThreadContext;
170 | | |
/* Motion vector with 16-bit components. */
typedef struct {
    int16_t x;
    int16_t y;
} MV;
175 | | |
/* Motion information of one block. Compared bytewise (memcmp) when used as
 * the element type of a unique list, so all members take part in equality. */
typedef struct {
    enum MVRefEnum mvref;  /* which reference(s) apply; MVREF_NONE = no motion data */
    MV f_mv;               /* NOTE(review): presumably the forward vector -- confirm */
    MV b_mv;               /* NOTE(review): presumably the backward vector -- confirm */
} MVInfo;
181 | | |
/* Per-block state kept in RV60Context.blk_info (row stride blk_stride):
 * the intra mode value used as a neighbour candidate by reconstruct_intra()
 * and the block's motion information. */
typedef struct {
    enum IntraMode imode;
    MVInfo mv;
} BlockInfo;
186 | | |
/* Per-prediction-unit state kept in RV60Context.pu_info (row stride pu_stride). */
typedef struct {
    enum CUType cu_type;
    enum PUType pu_type;
} PUInfo;
191 | | |
/* Decoder private context (AVCodecContext.priv_data). */
typedef struct RV60Context {
    AVCodecContext * avctx;
    VideoDSPContext vdsp;

    /* Indices into last_frame[]. */
#define CUR_PIC 0
#define LAST_PIC 1
#define NEXT_PIC 2
    AVFrame *last_frame[3];

    /* Frame header fields, filled by read_frame_header(). */
    int pict_type;
    int qp;
    int osvquant;
    int ts;
    int two_f_refs;
    int qp_off_type;
    int deblock;
    int deblock_chroma;
    /* Geometry derived in update_dimensions_clear_info(). */
    int awidth;      /* width rounded up to a multiple of 16 */
    int aheight;     /* height rounded up to a multiple of 16 */
    int cu_width;    /* width in 64-pixel units, rounded up */
    int cu_height;   /* height in 64-pixel units, rounded up */

    Slice * slice;   /* cu_height entries */

    int pu_stride;   /* cu_width << 3 */
    PUInfo * pu_info;

    int blk_stride;  /* cu_width << 4 */
    BlockInfo * blk_info;

    /* Only (re)allocated when deblock is set. */
    int dblk_stride; /* awidth >> 2 */
    uint8_t * left_str;
    uint8_t * top_str;

    uint64_t ref_pts[2], ts_scale;
    uint32_t ref_ts[2];

    struct ThreadProgress *progress;  /* nb_progress initialised entries */
    unsigned nb_progress;
} RV60Context;
232 | | |
233 | | static int progress_init(RV60Context *s, unsigned count) |
234 | 96.0k | { |
235 | 96.0k | if (s->nb_progress < count) { |
236 | 5.05k | void *tmp = av_realloc_array(s->progress, count, sizeof(*s->progress)); |
237 | 5.05k | if (!tmp) |
238 | 0 | return AVERROR(ENOMEM); |
239 | 5.05k | s->progress = tmp; |
240 | 5.05k | memset(s->progress + s->nb_progress, 0, (count - s->nb_progress) * sizeof(*s->progress)); |
241 | 28.7k | for (int i = s->nb_progress; i < count; i++) { |
242 | 23.7k | int ret = ff_thread_progress_init(&s->progress[i], 1); |
243 | 23.7k | if (ret < 0) |
244 | 0 | return ret; |
245 | 23.7k | s->nb_progress = i + 1; |
246 | 23.7k | } |
247 | 5.05k | } |
248 | | |
249 | 235k | for (int i = 0; i < count; i++) |
250 | 139k | ff_thread_progress_reset(&s->progress[i]); |
251 | | |
252 | 96.0k | return 0; |
253 | 96.0k | } |
254 | | |
255 | | static av_cold int rv60_decode_init(AVCodecContext * avctx) |
256 | 5.59k | { |
257 | 5.59k | static AVOnce init_static_once = AV_ONCE_INIT; |
258 | 5.59k | RV60Context *s = avctx->priv_data; |
259 | | |
260 | 5.59k | s->avctx = avctx; |
261 | | |
262 | 5.59k | ff_videodsp_init(&s->vdsp, 8); |
263 | | |
264 | 5.59k | avctx->pix_fmt = AV_PIX_FMT_YUV420P; |
265 | | |
266 | 22.3k | for (int i = 0; i < 3; i++) { |
267 | 16.7k | s->last_frame[i] = av_frame_alloc(); |
268 | 16.7k | if (!s->last_frame[i]) |
269 | 0 | return AVERROR(ENOMEM); |
270 | 16.7k | } |
271 | | |
272 | 5.59k | ff_thread_once(&init_static_once, rv60_init_static_data); |
273 | | |
274 | 5.59k | return 0; |
275 | 5.59k | } |
276 | | |
277 | | static int update_dimensions_clear_info(RV60Context *s, int width, int height) |
278 | 112k | { |
279 | 112k | int ret; |
280 | | |
281 | 112k | if (width != s->avctx->width || height != s->avctx->height) { |
282 | | |
283 | 26.5k | av_log(s->avctx, AV_LOG_INFO, "changing dimensions to %dx%d\n", width, height); |
284 | | |
285 | 106k | for (int i = 0; i < 3; i++) |
286 | 79.6k | av_frame_unref(s->last_frame[i]); |
287 | | |
288 | 26.5k | if ((ret = ff_set_dimensions(s->avctx, width, height)) < 0) |
289 | 8.42k | return ret; |
290 | | |
291 | 18.1k | if (s->avctx->width <= 64 || s->avctx->height <= 64) |
292 | 13.0k | av_log(s->avctx, AV_LOG_WARNING, "unable to faithfully reproduce emulated edges; expect visual artefacts\n"); |
293 | 18.1k | } |
294 | | |
295 | 103k | s->awidth = FFALIGN(width, 16); |
296 | 103k | s->aheight = FFALIGN(height, 16); |
297 | | |
298 | 103k | s->cu_width = (width + 63) >> 6; |
299 | 103k | s->cu_height = (height + 63) >> 6; |
300 | | |
301 | 103k | s->pu_stride = s->cu_width << 3; |
302 | 103k | s->blk_stride = s->cu_width << 4; |
303 | | |
304 | 103k | if ((ret = av_reallocp_array(&s->slice, s->cu_height, sizeof(s->slice[0]))) < 0) |
305 | 0 | return ret; |
306 | | |
307 | 103k | if ((ret = av_reallocp_array(&s->pu_info, s->pu_stride * (s->cu_height << 3), sizeof(s->pu_info[0]))) < 0) |
308 | 0 | return ret; |
309 | | |
310 | 103k | if ((ret = av_reallocp_array(&s->blk_info, s->blk_stride * (s->cu_height << 4), sizeof(s->blk_info[0]))) < 0) |
311 | 0 | return ret; |
312 | | |
313 | 103k | memset(s->pu_info, 0, s->pu_stride * (s->cu_height << 3) * sizeof(s->pu_info[0])); |
314 | 103k | memset(s->blk_info, 0, s->blk_stride * (s->cu_height << 4) * sizeof(s->blk_info[0])); |
315 | | |
316 | 6.11M | for (int j = 0; j < s->cu_height << 4; j++) |
317 | 2.52G | for (int i = 0; i < s->cu_width << 4; i++) |
318 | 2.51G | s->blk_info[j*s->blk_stride + i].mv.mvref = MVREF_NONE; |
319 | | |
320 | 103k | if (s->deblock) { |
321 | 20.2k | int size; |
322 | | |
323 | 20.2k | s->dblk_stride = s->awidth >> 2; |
324 | | |
325 | 20.2k | size = s->dblk_stride * (s->aheight >> 2); |
326 | | |
327 | 20.2k | if ((ret = av_reallocp_array(&s->top_str, size, sizeof(s->top_str[0]))) < 0) |
328 | 0 | return ret; |
329 | | |
330 | 20.2k | if ((ret = av_reallocp_array(&s->left_str, size, sizeof(s->left_str[0]))) < 0) |
331 | 0 | return ret; |
332 | | |
333 | 20.2k | memset(s->top_str, 0, size); |
334 | 20.2k | memset(s->left_str, 0, size); |
335 | 20.2k | } |
336 | | |
337 | 103k | return 0; |
338 | 103k | } |
339 | | |
340 | | static int read_code012(GetBitContext * gb) |
341 | 9.33M | { |
342 | 9.33M | if (!get_bits1(gb)) |
343 | 889k | return 0; |
344 | 8.44M | return get_bits1(gb) + 1; |
345 | 9.33M | } |
346 | | |
/*
 * Parse the frame header from gb into s and report the coded dimensions
 * through *width / *height.
 *
 * Fields that are skipped are simply not used by this decoder. The order of
 * the reads is the bitstream layout and must not be changed.
 *
 * Returns 0 on success, AVERROR_INVALIDDATA if the 2-bit marker is not 3 or
 * the frame type code is the reserved one.
 */
static int read_frame_header(RV60Context *s, GetBitContext *gb, int * width, int * height)
{
    if (get_bits(gb, 2) != 3)
        return AVERROR_INVALIDDATA;

    skip_bits(gb, 2);
    skip_bits(gb, 4);

    s->pict_type = frame_types[get_bits(gb, 2)];
    if (s->pict_type == AV_PICTURE_TYPE_NONE)
        return AVERROR_INVALIDDATA;

    s->qp = get_bits(gb, 6);
    skip_bits1(gb);
    skip_bits(gb, 2);
    s->osvquant = get_bits(gb, 2);
    skip_bits1(gb);
    skip_bits(gb, 2);
    s->ts = get_bits(gb, 24);
    /* Dimensions are coded in units of 4 pixels.
     * NOTE(review): only the width carries a +1 bias -- confirm that the
     * asymmetry with height is intended by the format. */
    *width = (get_bits(gb, 11) + 1) * 4;
    *height = get_bits(gb, 11) * 4;
    skip_bits1(gb);
    if (s->pict_type == AV_PICTURE_TYPE_I) {
        s->two_f_refs = 0;
    } else {
        /* Optional 3-bit field, then the two-forward-references flag. */
        if (get_bits1(gb))
            skip_bits(gb, 3);
        s->two_f_refs = get_bits1(gb);
    }
    /* Three 0..2 codes; only the last one is kept. */
    read_code012(gb);
    read_code012(gb);
    s->qp_off_type = read_code012(gb);
    s->deblock = get_bits1(gb);
    /* The chroma bit is only present when deblocking is on; a set bit disables it. */
    s->deblock_chroma = s->deblock && !get_bits1(gb);

    if (get_bits1(gb)) {
        int count = get_bits(gb, 2);
        if (count) {
            /* Skip `count` groups of 2, 4, 8 ... bytes (2 << i bytes in group i). */
            skip_bits(gb, 2);
            for (int i = 0; i < count; i++)
                for (int j = 0; j < 2 << i; j++)
                    skip_bits(gb, 8);
        }
    }

    return 0;
}
394 | | |
395 | | static int read_slice_sizes(RV60Context *s, GetBitContext *gb) |
396 | 103k | { |
397 | 103k | int nbits = get_bits(gb, 5) + 1; |
398 | 103k | int last_size; |
399 | | |
400 | 473k | for (int i = 0; i < s->cu_height; i++) |
401 | 369k | s->slice[i].sign = get_bits1(gb); |
402 | | |
403 | 103k | s->slice[0].size = last_size = get_bits_long(gb, nbits); |
404 | | |
405 | 103k | if (last_size < 0) |
406 | 458 | return AVERROR_INVALIDDATA; |
407 | | |
408 | 168k | for (int i = 1; i < s->cu_height; i++) { |
409 | 71.5k | int diff = get_bits_long(gb, nbits); |
410 | 71.5k | if (s->slice[i].sign) |
411 | 42.1k | last_size += diff; |
412 | 29.3k | else |
413 | 29.3k | last_size -= diff; |
414 | 71.5k | if (last_size <= 0) |
415 | 6.20k | return AVERROR_INVALIDDATA; |
416 | 65.3k | s->slice[i].size = last_size; |
417 | 65.3k | } |
418 | | |
419 | 97.1k | align_get_bits(gb); |
420 | 97.1k | return 0; |
421 | 103k | } |
422 | | |
423 | | static int read_intra_mode(GetBitContext * gb, int * param) |
424 | 9.51M | { |
425 | 9.51M | if (get_bits1(gb)) { |
426 | 8.52M | *param = read_code012(gb); |
427 | 8.52M | return INTRAMODE_INDEX; |
428 | 8.52M | } else { |
429 | 991k | *param = get_bits(gb, 5); |
430 | 991k | return INTRAMODE_MODE; |
431 | 991k | } |
432 | 9.51M | } |
433 | | |
434 | | static int has_top_block(const RV60Context * s, int xpos, int ypos, int dx, int dy, int size) |
435 | 24.0M | { |
436 | 24.0M | return ypos + dy && xpos + dx + size <= s->awidth; |
437 | 24.0M | } |
438 | | |
439 | | static int has_left_block(const RV60Context * s, int xpos, int ypos, int dx, int dy, int size) |
440 | 25.5M | { |
441 | 25.5M | return xpos + dx && ypos + dy + size <= s->aheight; |
442 | 25.5M | } |
443 | | |
444 | | static int has_top_right_block(const RV60Context * s, int xpos, int ypos, int dx, int dy, int size) |
445 | 13.7M | { |
446 | 13.7M | if (has_top_block(s, xpos, ypos, dx, dy, size * 2)) { |
447 | 13.2M | int cxpos = ((xpos + dx) & 63) >> ff_log2(size); |
448 | 13.2M | int cypos = ((ypos + dy) & 63) >> ff_log2(size); |
449 | 13.2M | return !(rv60_avail_mask[cxpos] & cypos); |
450 | 13.2M | } |
451 | 442k | return 0; |
452 | 13.7M | } |
453 | | |
454 | | static int has_left_down_block(const RV60Context * s, int xpos, int ypos, int dx, int dy, int size) |
455 | 16.0M | { |
456 | 16.0M | if (has_left_block(s, xpos, ypos, dx, dy, size * 2)) { |
457 | 13.3M | int cxpos = (~(xpos + dx) & 63) >> ff_log2(size); |
458 | 13.3M | int cypos = (~(ypos + dy) & 63) >> ff_log2(size); |
459 | 13.3M | return rv60_avail_mask[cxpos] & cypos; |
460 | 13.3M | } |
461 | 2.67M | return 0; |
462 | 16.0M | } |
463 | | |
/* Reference samples for intra prediction, gathered by populate_ipred().
 * Index 0 of t[] / l[] holds the top-left corner sample; t[1..] is the row
 * above (followed by the top-right extension) and l[1..] the column to the
 * left (followed by the left-down extension). Unavailable samples stay 0x80. */
typedef struct {
    uint8_t t[129];
    uint8_t l[129];
    int has_t;   /* row above is available */
    int has_tr;  /* top-right extension holds real samples */
    int has_l;   /* left column is available */
    int has_ld;  /* left-down extension holds real samples */
} IntraPredContext;
472 | | |
/* State of the coding unit currently being decoded. */
typedef struct {
    int xpos;     /* luma position of the CU in the picture */
    int ypos;
    int pu_pos;   /* index of the CU into RV60Context.pu_info */
    int blk_pos;  /* index of the CU into RV60Context.blk_info */

    enum CUType cu_type;
    enum PUType pu_type;
    enum IntraMode imode[4];  /* signalling kind per sub-block (see reconstruct_intra()) */
    int imode_param[4];       /* value read along with imode[] */
    MVInfo mv[4];

    IntraPredContext ipred;   /* refilled by populate_ipred() */
} CUContext;
487 | | |
488 | | static void ipred_init(IntraPredContext * i) |
489 | 16.4M | { |
490 | 16.4M | memset(i->t, 0x80, sizeof(i->t)); |
491 | 16.4M | memset(i->l, 0x80, sizeof(i->l)); |
492 | 16.4M | i->has_t = i->has_tr = i->has_l = i->has_ld = 0; |
493 | 16.4M | } |
494 | | |
/*
 * Collect the intra reference samples for one block into cu->ipred.
 *
 * src/stride describe the plane being predicted; xoff/yoff give the block's
 * offset inside the CU (used for luma only), size is the block size in that
 * plane. For chroma the CU position is halved and the availability checks
 * are done on the luma grid with a doubled size.
 *
 * Extensions that are unavailable are padded by repeating the last
 * available sample of the respective row / column.
 */
static void populate_ipred(const RV60Context * s, CUContext * cu, const uint8_t * src, int stride, int xoff, int yoff, int size, int is_luma)
{
    /* Move src to the top-left sample of the block. */
    if (is_luma)
        src += (cu->ypos + yoff) * stride + cu->xpos + xoff;
    else
        src += (cu->ypos >> 1) * stride + (cu->xpos >> 1);

    ipred_init(&cu->ipred);

    if (cu->ypos + yoff > 0) {
        cu->ipred.has_t = 1;

        memcpy(cu->ipred.t + 1, src - stride, size);

        if ((is_luma && has_top_right_block(s, cu->xpos, cu->ypos, xoff, yoff, size)) ||
            (!is_luma && has_top_right_block(s, cu->xpos, cu->ypos, 0, 0, size << 1))) {
            cu->ipred.has_tr = 1;
            memcpy(cu->ipred.t + size + 1, src - stride + size, size);
        } else
            memset(cu->ipred.t + size + 1, cu->ipred.t[size], size);

        /* Corner sample, only when a left neighbour exists as well. */
        if (cu->xpos + xoff > 0)
            cu->ipred.t[0] = src[-stride - 1];
    }

    if (cu->xpos + xoff > 0) {
        cu->ipred.has_l = 1;

        for (int y = 0; y < size; y++)
            cu->ipred.l[y + 1] = src[y*stride - 1];

        if ((is_luma && has_left_down_block(s, cu->xpos, cu->ypos, xoff, yoff, size)) ||
            (!is_luma && has_left_down_block(s, cu->xpos, cu->ypos, 0, 0, size << 1))) {
            cu->ipred.has_ld = 1;
            for (int y = size; y < size * 2; y++)
                cu->ipred.l[y + 1] = src[y*stride - 1];
        } else
            memset(cu->ipred.l + size + 1, cu->ipred.l[size], size);

        /* Same corner sample, mirrored into the left array. */
        if (cu->ypos + yoff > 0)
            cu->ipred.l[0] = src[-stride - 1];
    }
}
538 | | |
539 | | static void pred_plane(const IntraPredContext * p, uint8_t * dst, int stride, int size) |
540 | 5.66M | { |
541 | 5.66M | int lastl = p->l[size + 1]; |
542 | 5.66M | int lastt = p->t[size + 1]; |
543 | 5.66M | int tmp1[64], tmp2[64]; |
544 | 5.66M | int top_ref[64], left_ref[64]; |
545 | 5.66M | int shift; |
546 | | |
547 | 29.5M | for (int i = 0; i < size; i++) { |
548 | 23.8M | tmp1[i] = lastl - p->t[i + 1]; |
549 | 23.8M | tmp2[i] = lastt - p->l[i + 1]; |
550 | 23.8M | } |
551 | | |
552 | 5.66M | shift = ff_log2(size) + 1; |
553 | 29.5M | for (int i = 0; i < size; i++) { |
554 | 23.8M | top_ref[i] = p->t[i + 1] << (shift - 1); |
555 | 23.8M | left_ref[i] = p->l[i + 1] << (shift - 1); |
556 | 23.8M | } |
557 | | |
558 | 29.5M | for (int y = 0; y < size; y++) { |
559 | 23.8M | int add = tmp2[y]; |
560 | 23.8M | int sum = left_ref[y] + size; |
561 | 154M | for (int x = 0; x < size; x++) { |
562 | 130M | int v = tmp1[x] + top_ref[x]; |
563 | 130M | sum += add; |
564 | 130M | top_ref[x] = v; |
565 | 130M | dst[y*stride + x] = (sum + v) >> shift; |
566 | 130M | } |
567 | 23.8M | } |
568 | 5.66M | } |
569 | | |
570 | | static void pred_dc(const IntraPredContext * p, uint8_t * dst, int stride, int size, int filter) |
571 | 4.92M | { |
572 | 4.92M | int dc; |
573 | | |
574 | 4.92M | if (!p->has_t && !p->has_l) |
575 | 22.7k | dc = 0x80; |
576 | 4.89M | else { |
577 | 4.89M | int sum = 0; |
578 | 4.89M | if (p->has_t) |
579 | 36.2M | for (int x = 0; x < size; x++) |
580 | 32.5M | sum += p->t[x + 1]; |
581 | 4.89M | if (p->has_l) |
582 | 74.5M | for (int y = 0; y < size; y++) |
583 | 69.7M | sum += p->l[y + 1]; |
584 | 4.89M | if (p->has_t && p->has_l) |
585 | 3.66M | dc = (sum + size) / (size * 2); |
586 | 1.22M | else |
587 | 1.22M | dc = (sum + size / 2) / size; |
588 | 4.89M | } |
589 | | |
590 | 76.4M | for (int y = 0; y < size; y++) |
591 | 71.4M | memset(dst + y*stride, dc, size); |
592 | | |
593 | 4.92M | if (filter && p->has_t && p->has_l) { |
594 | 3.16M | dst[0] = (p->t[1] + p->l[1] + 2 * dst[0] + 2) >> 2; |
595 | 21.4M | for (int x = 1; x < size; x++) |
596 | 18.3M | dst[x] = (p->t[x + 1] + 3 * dst[x] + 2) >> 2; |
597 | 21.4M | for (int y = 1; y < size; y++) |
598 | 18.3M | dst[y*stride] = (p->l[y + 1] + 3 * dst[y*stride] + 2) >> 2; |
599 | 3.16M | } |
600 | 4.92M | } |
601 | | |
/*
 * Smooth `size` samples from src into dst with a [1 2 1] / 4 kernel
 * (rounded). The first and last samples are copied unfiltered.
 */
static void filter_weak(uint8_t * dst, const uint8_t * src, int size)
{
    const int last = size - 1;

    dst[0] = src[0];
    for (int k = 1; k < last; k++) {
        const int weighted = src[k - 1] + 2 * src[k] + src[k + 1] + 2;

        dst[k] = weighted >> 2;
    }
    dst[last] = src[last];
}
609 | | |
/*
 * Write `size` samples of a linear ramp that starts at v0 and advances by
 * (v1 - v0) / 32 per sample, using 5 fractional bits with rounding.
 */
static void filter_bilin32(uint8_t * dst, int v0, int v1, int size)
{
    const int step = v1 - v0;
    int acc = (v0 << 5) + (1 << 4);
    int k = 0;

    while (k < size) {
        dst[k++] = acc >> 5;
        acc += step;
    }
}
619 | | |
/*
 * Angular prediction that walks the reference array per output column.
 *
 * For column x the reference position advances by `weight` (1/32 sample
 * units, may be negative). The integer part, biased by 32, selects the
 * starting sample in src and the 5-bit fraction blends it with the next
 * sample. src must therefore be addressable around offset 32.
 */
static void pred_hor_angle(uint8_t * dst, int stride, int size, int weight, const uint8_t * src)
{
    int pos = 0;

    for (int x = 0; x < size; x++) {
        const uint8_t *ref;
        uint8_t *col = dst + x;
        int frac;

        pos += weight;
        ref  = src + ((pos >> 5) + 32);
        frac = pos & 0x1F;

        if (frac == 0) {
            for (int y = 0; y < size; y++)
                col[y*stride] = ref[y];
        } else {
            const int inv = 32 - frac;

            for (int y = 0; y < size; y++)
                col[y*stride] = (inv * ref[y] + frac * ref[y + 1] + 16) >> 5;
        }
    }
}
640 | | |
/*
 * Angular prediction that walks the reference array per output row.
 *
 * For row y the reference position advances by `weight` (1/32 sample units,
 * may be negative). The integer part, biased by 32, selects the starting
 * sample in src and the 5-bit fraction blends neighbouring samples. Rows
 * with a zero fraction are plain copies.
 */
static void pred_ver_angle(uint8_t * dst, int stride, int size, int weight, const uint8_t * src)
{
    int pos = 0;

    for (int y = 0; y < size; y++) {
        uint8_t *row = dst + y*stride;
        const uint8_t *ref;
        int frac;

        pos += weight;
        ref  = src + ((pos >> 5) + 32);
        frac = pos & 0x1F;

        if (!frac) {
            memcpy(row, ref, size);
            continue;
        }

        for (int x = 0; x < size; x++)
            row[x] = ((32 - frac) * ref[x] + frac * ref[x + 1] + 16) >> 5;
    }
}
660 | | |
/*
 * Intra prediction dispatcher: predict a size x size block into dst from
 * the reference samples in p according to the numeric mode imode.
 *
 *   0        plane
 *   1        DC (edge-filtered when `filter` is set)
 *   2..9     angular, from the left column and its downward extension
 *   10       pure horizontal (optionally gradient-corrected along the top)
 *   11..17   angular, from the left column extended with projected top samples
 *   18..25   angular, from the top row extended with projected left samples
 *   26       pure vertical (optionally gradient-corrected along the left)
 *   27..34   angular, from the top row and its rightward extension
 *
 * The working reference line lives at offset 32 of filtered1 so that the
 * negative-angle modes can prepend projected samples below that offset.
 *
 * Returns 0 on success, AVERROR_INVALIDDATA for imode > 34.
 */
static int pred_angle(const IntraPredContext * p, uint8_t * dst, int stride, int size, int imode, int filter)
{
    uint8_t filtered1[96], filtered2[96];

    if (!imode) {
        pred_plane(p, dst, stride, size);
    } else if (imode == 1) {
        pred_dc(p, dst, stride, size, filter);
    } else if (imode <= 9) {
        int ang_weight = rv60_ipred_angle[10 - imode];
        /* Number of extra reference samples reached beyond `size`. */
        int add_size = (size * ang_weight + 31) >> 5;
        if (size <= 16) {
            filter_weak(filtered1 + 32, &p->l[1], size + add_size);
        } else {
            /* Blocks above 16 use linear ramps instead of the smoothed reference. */
            filter_bilin32(filtered1 + 32, p->l[1], p->l[33], 32);
            filter_bilin32(filtered1 + 64, p->l[32], p->l[64], add_size);
        }
        pred_hor_angle(dst, stride, size, ang_weight, filtered1);
    } else if (imode == 10) {
        if (size <= 16)
            filter_weak(filtered1 + 32, &p->l[1], size);
        else
            filter_bilin32(filtered1 + 32, p->l[1], p->l[33], 32);
        /* Every row is filled with its left reference sample. */
        for (int y = 0; y < size; y++)
            for (int x = 0; x < size; x++)
                dst[y*stride + x] = filtered1[32 + y];
        if (filter) {
            /* Add half the top-row gradient (relative to the corner) to the first row. */
            int tl = p->t[0];
            for (int x = 0; x < size; x++)
                dst[x] = av_clip_uint8(dst[x] + ((p->t[x + 1] - tl) >> 1));
        }
    } else if (imode <= 17) {
        int ang_weight = rv60_ipred_angle[imode - 10];
        int inv_angle = rv60_ipred_inv_angle[imode - 10];
        int add_size = (size * ang_weight + 31) >> 5;
        /* Main reference = left column (corner at index 31), side = top row. */
        if (size <= 16) {
            memcpy(filtered1 + 32 - 1, p->l, size + 1);
            memcpy(filtered2 + 32 - 1, p->t, size + 1);
        } else {
            filtered1[32 - 1] = p->l[0];
            filter_bilin32(filtered1 + 32, p->l[0], p->l[32], 32);
            filtered2[32 - 1] = p->t[0];
            filter_bilin32(filtered2 + 32, p->t[0], p->t[32], 32);
        }
        if (add_size > 1) {
            /* Project side samples onto the main line below index 31, stepping
             * by inv_angle in 8.8 fixed point (0x80 = rounding offset). */
            int sum = 0x80;
            for (int i = 1; i < add_size; i++) {
                sum += inv_angle;
                filtered1[32 - 1 - i] = filtered2[32 - 1 + (sum >> 8)];
            }
        }
        pred_hor_angle(dst, stride, size, -ang_weight, filtered1);
    } else if (imode <= 25) {
        int ang_weight = rv60_ipred_angle[26 - imode];
        int inv_angle = rv60_ipred_inv_angle[26 - imode];
        int add_size = (size * ang_weight + 31) >> 5;
        /* Mirror of the previous case: main = top row, side = left column. */
        if (size <= 16) {
            memcpy(filtered1 + 32 - 1, p->t, size + 1);
            memcpy(filtered2 + 32 - 1, p->l, size + 1);
        } else {
            filtered1[32 - 1] = p->t[0];
            filter_bilin32(filtered1 + 32, p->t[0], p->t[32], 32);
            filtered2[32 - 1] = p->l[0];
            filter_bilin32(filtered2 + 32, p->l[0], p->l[32], 32);
        }
        if (add_size > 1) {
            int sum = 0x80;
            for (int i = 1; i < add_size; i++) {
                sum += inv_angle;
                filtered1[32 - 1 - i] = filtered2[32 - 1 + (sum >> 8)];
            }
        }
        pred_ver_angle(dst, stride, size, -ang_weight, filtered1);
    } else if (imode == 26) {
        if (size <= 16)
            filter_weak(&filtered1[32], &p->t[1], size);
        else
            filter_bilin32(filtered1 + 32, p->t[1], p->t[33], 32);
        /* Every row is a copy of the (filtered) top reference. */
        for (int i = 0; i < size; i++)
            memcpy(dst + i*stride, filtered1 + 32, size);
        if (filter) {
            /* Add half the left-column gradient (relative to the corner) to the first column. */
            int tl = p->l[0];
            for (int y = 0; y < size; y++)
                dst[y*stride] = av_clip_uint8(dst[y*stride] + ((p->l[y+1] - tl) >> 1));
        }
    } else if (imode <= 34) {
        int ang_weight = rv60_ipred_angle[imode - 26];
        int add_size = (size * ang_weight + 31) >> 5;
        if (size <= 16)
            filter_weak(&filtered1[32], &p->t[1], size + add_size);
        else {
            filter_bilin32(filtered1 + 32, p->t[1], p->t[33], 32);
            filter_bilin32(filtered1 + 64, p->t[32], p->t[64], add_size);
        }
        pred_ver_angle(dst, stride, size, ang_weight, filtered1);
    } else
        return AVERROR_INVALIDDATA;
    return 0;
}
760 | | |
761 | | static int pu_is_intra(const PUInfo * pu) |
762 | 25.8M | { |
763 | 25.8M | return pu->cu_type == CU_INTRA; |
764 | 25.8M | } |
765 | | |
766 | | static int ipm_compar(const void * a, const void * b) |
767 | 2.64M | { |
768 | 2.64M | return *(const enum IntraMode *)a - *(const enum IntraMode *)b; |
769 | 2.64M | } |
770 | | |
/*
 * Generate a small fixed-capacity list type without duplicate entries:
 *
 *   unique_list_<name>         struct with `list[max_size]` and `size`
 *   unique_list_<name>_init()  zero the storage and set size to 0
 *   unique_list_<name>_add()   append cand unless the list is full or an
 *                              entry with the same bytes is already present
 *
 * Equality is a memcmp() over sizeof(type), so `type` should not contain
 * padding that could differ between otherwise equal values.
 */
#define MK_UNIQUELIST(name, type, max_size) \
typedef struct { \
    type list[max_size]; \
    int size; \
} unique_list_##name; \
\
static void unique_list_##name##_init(unique_list_##name * s) \
{ \
    memset(s->list, 0, sizeof(s->list)); \
    s->size = 0; \
} \
\
static void unique_list_##name##_add(unique_list_##name * s, type cand) \
{ \
    if (s->size == max_size) \
        return; \
    \
    for (int i = 0; i < s->size; i++) { \
        if (!memcmp(&s->list[i], &cand, sizeof(type))) { \
            return; \
        } \
    } \
    s->list[s->size++] = cand; \
}
795 | | |
/* Up to 3 distinct intra mode candidates (used by reconstruct_intra()). */
MK_UNIQUELIST(intramode, enum IntraMode, 3)
/* Up to 4 distinct motion candidates (filled through add_if_valid()). */
MK_UNIQUELIST(mvinfo, MVInfo, 4)
798 | | |
/*
 * Resolve the signalled intra mode of sub-block `sub` (0..3, bit 0 = right
 * half, bit 1 = bottom half) of the coding unit into the numeric mode used
 * by pred_angle().
 *
 * A list of three distinct candidate modes is built from the top, left and
 * top-left neighbouring blocks (only those inside intra PUs), topped up
 * from rv60_candidate_intra_angles. Then:
 *   - INTRAMODE_INDEX: imode_param selects one of the candidates;
 *   - INTRAMODE_MODE:  imode_param is a mode number among the non-candidate
 *     modes; it is incremented once for every candidate, taken in ascending
 *     order, that it has reached or passed.
 *
 * INTRAMODE_DC64 / INTRAMODE_PLANE64 on sub-block 0 short-circuit to mode 1
 * and mode 0 respectively for the whole CU.
 */
static int reconstruct_intra(const RV60Context * s, const CUContext * cu, int size, int sub)
{
    int blk_pos, tl_x, tl_y;
    unique_list_intramode ipm_cand;

    if (cu->imode[0] == INTRAMODE_DC64)
        return 1;

    if (cu->imode[0] == INTRAMODE_PLANE64)
        return 0;

    unique_list_intramode_init(&ipm_cand);

    /* Candidate from the block directly above (same column as the sub-block). */
    if (has_top_block(s, cu->xpos, cu->ypos, (sub & 1) * 4, 0, size)) {
        const PUInfo * pu = &s->pu_info[cu->pu_pos - s->pu_stride];
        if (pu_is_intra(pu))
            unique_list_intramode_add(&ipm_cand, s->blk_info[cu->blk_pos - s->blk_stride + (sub & 1)].imode);
    }

    /* Position of this sub-block inside blk_info. */
    blk_pos = cu->blk_pos + (sub >> 1) * s->blk_stride + (sub & 1);

    /* Candidate from the block left of the CU, in the sub-block's row. */
    if (has_left_block(s, cu->xpos, cu->ypos, 0, (sub & 2) * 2, size)) {
        const PUInfo * pu = &s->pu_info[cu->pu_pos - 1];
        if (pu_is_intra(pu))
            unique_list_intramode_add(&ipm_cand, s->blk_info[blk_pos - 1 - (sub & 1)].imode);
    }

    /* Candidate from the top-left neighbour, if it lies inside the picture. */
    tl_x = !(sub & 2) ? (cu->xpos + (sub & 1) * 4) : cu->xpos;
    tl_y = cu->ypos + (sub & 2) * 4;
    if (tl_x > 0 && tl_y > 0) {
        const PUInfo * pu;
        switch (sub) {
        case 0: pu = &s->pu_info[cu->pu_pos - s->pu_stride - 1]; break;
        case 1: pu = &s->pu_info[cu->pu_pos - s->pu_stride]; break;
        default: pu = &s->pu_info[cu->pu_pos - 1];
        }
        if (pu_is_intra(pu)) {
            if (sub != 3)
                unique_list_intramode_add(&ipm_cand, s->blk_info[blk_pos - s->blk_stride - 1].imode);
            else
                unique_list_intramode_add(&ipm_cand, s->blk_info[blk_pos - s->blk_stride - 2].imode);
        }
    }

    /* Top up with the default angles; adds are ignored once the list is full. */
    for (int i = 0; i < FF_ARRAY_ELEMS(rv60_candidate_intra_angles); i++)
        unique_list_intramode_add(&ipm_cand, rv60_candidate_intra_angles[i]);

    if (cu->imode[sub] == INTRAMODE_INDEX)
        return ipm_cand.list[cu->imode_param[sub]];

    if (cu->imode[sub] == INTRAMODE_MODE) {
        enum IntraMode imode = cu->imode_param[sub];
        /* Ascending order is required for the stepwise skip below. */
        qsort(ipm_cand.list, 3, sizeof(ipm_cand.list[0]), ipm_compar);
        for (int i = 0; i < 3; i++)
            if (imode >= ipm_cand.list[i])
                imode++;
        return imode;
    }

    av_assert0(0); // should never reach here
    return 0;
}
861 | | |
862 | | static int get_skip_mv_index(enum MVRefEnum mvref) |
863 | 8.51M | { |
864 | 8.51M | switch (mvref) { |
865 | 72.7k | case MVREF_SKIP1: return 1; |
866 | 32.9k | case MVREF_SKIP2: return 2; |
867 | 8.34M | case MVREF_SKIP3: return 3; |
868 | 61.7k | default: return 0; |
869 | 8.51M | } |
870 | 8.51M | } |
871 | | |
872 | | static void add_if_valid(unique_list_mvinfo * skip_cand, const MVInfo * mvi) |
873 | 58.5M | { |
874 | 58.5M | if (mvi->mvref != MVREF_NONE) |
875 | 49.1M | unique_list_mvinfo_add(skip_cand, *mvi); |
876 | 58.5M | } |
877 | | |
878 | | static void fill_mv_skip_cand(RV60Context * s, const CUContext * cu, unique_list_mvinfo * skip_cand, int size) |
879 | 8.51M | { |
880 | 8.51M | int mv_size = size >> 2; |
881 | | |
882 | 8.51M | if (cu->xpos) |
883 | 8.46M | add_if_valid(skip_cand, &s->blk_info[cu->blk_pos - 1].mv); |
884 | 8.51M | if (cu->ypos) |
885 | 8.35M | add_if_valid(skip_cand, &s->blk_info[cu->blk_pos - s->blk_stride].mv); |
886 | 8.51M | if (cu->ypos && cu->xpos + size < s->awidth) |
887 | 8.28M | add_if_valid(skip_cand, &s->blk_info[cu->blk_pos - s->blk_stride + mv_size].mv); |
888 | 8.51M | if (cu->xpos && cu->ypos + size < s->aheight) |
889 | 8.36M | add_if_valid(skip_cand, &s->blk_info[cu->blk_pos + s->blk_stride * mv_size - 1].mv); |
890 | 8.51M | if (cu->xpos) |
891 | 8.46M | add_if_valid(skip_cand, &s->blk_info[cu->blk_pos + s->blk_stride * (mv_size - 1) - 1].mv); |
892 | 8.51M | if (cu->ypos) |
893 | 8.35M | add_if_valid(skip_cand, &s->blk_info[cu->blk_pos - s->blk_stride + mv_size - 1].mv); |
894 | 8.51M | if (cu->xpos && cu->ypos) |
895 | 8.30M | add_if_valid(skip_cand, &s->blk_info[cu->blk_pos - s->blk_stride - 1].mv); |
896 | | |
897 | 33.7M | for (int i = skip_cand->size; i < 4; i++) |
898 | 25.2M | skip_cand->list[i] = (MVInfo){.mvref=MVREF_REF0,.f_mv={0,0},.b_mv={0,0}}; |
899 | 8.51M | } |
900 | | |
/** Width/height pair, as filled in by get_mv_dimensions(). */
typedef struct {
    int w; ///< width
    int h; ///< height
} Dimensions;
904 | | |
905 | | static void get_mv_dimensions(Dimensions * dim, enum PUType pu_type, int part_no, int size) |
906 | 9.78M | { |
907 | 9.78M | int mv_size = size >> 2; |
908 | 9.78M | switch (pu_type) { |
909 | 8.52M | case PU_FULL: |
910 | 8.52M | dim->w = dim->h = mv_size; |
911 | 8.52M | break; |
912 | 129k | case PU_N2HOR: |
913 | 129k | dim->w = mv_size; |
914 | 129k | dim->h = mv_size >> 1; |
915 | 129k | break; |
916 | 527k | case PU_N2VER: |
917 | 527k | dim->w = mv_size >> 1; |
918 | 527k | dim->h = mv_size; |
919 | 527k | break; |
920 | 560k | case PU_QUARTERS: |
921 | 560k | dim->w = dim->h = mv_size >> 1; |
922 | 560k | break; |
923 | 11.9k | case PU_N4HOR: |
924 | 11.9k | dim->w = mv_size; |
925 | 11.9k | dim->h = !part_no ? (mv_size >> 2) : ((3 * mv_size) >> 2); |
926 | 11.9k | break; |
927 | 13.3k | case PU_N34HOR: |
928 | 13.3k | dim->w = mv_size; |
929 | 13.3k | dim->h = !part_no ? ((3 * mv_size) >> 2) : (mv_size >> 2); |
930 | 13.3k | break; |
931 | 8.93k | case PU_N4VER: |
932 | 8.93k | dim->w = !part_no ? (mv_size >> 2) : ((3 * mv_size) >> 2); |
933 | 8.93k | dim->h = mv_size; |
934 | 8.93k | break; |
935 | 7.38k | case PU_N34VER: |
936 | 7.38k | dim->w = !part_no ? ((3 * mv_size) >> 2) : (mv_size >> 2); |
937 | 7.38k | dim->h = mv_size; |
938 | 7.38k | break; |
939 | 9.78M | } |
940 | 9.78M | } |
941 | | |
942 | | static int has_hor_split(enum PUType pu_type) |
943 | 9.21M | { |
944 | 9.21M | return pu_type == PU_N2HOR || pu_type == PU_N4HOR || pu_type == PU_N34HOR || pu_type == PU_QUARTERS; |
945 | 9.21M | } |
946 | | |
947 | | static int has_ver_split(enum PUType pu_type) |
948 | 9.05M | { |
949 | 9.05M | return pu_type == PU_N2VER || pu_type == PU_N4VER || pu_type == PU_N34VER || pu_type == PU_QUARTERS; |
950 | 9.05M | } |
951 | | |
952 | | static int pu_type_num_parts(enum PUType pu_type) |
953 | 9.27M | { |
954 | 9.27M | switch (pu_type) { |
955 | 8.53M | case PU_FULL: return 1; |
956 | 211k | case PU_QUARTERS: return 4; |
957 | 529k | default: return 2; |
958 | 9.27M | } |
959 | 9.27M | } |
960 | | |
961 | | static void get_next_mv(const RV60Context * s, const Dimensions * dim, enum PUType pu_type, int part_no, int * mv_pos, int * mv_x, int * mv_y) |
962 | 9.77M | { |
963 | 9.77M | if (pu_type == PU_QUARTERS) { |
964 | 560k | if (part_no != 1) { |
965 | 420k | *mv_pos += dim->w; |
966 | 420k | *mv_x += dim->w; |
967 | 420k | } else { |
968 | 140k | *mv_pos += dim->h*s->blk_stride - dim->w; |
969 | 140k | *mv_x -= dim->w; |
970 | 140k | *mv_y += dim->h; |
971 | 140k | } |
972 | 9.21M | } else if (has_hor_split(pu_type)) { |
973 | 150k | *mv_pos += dim->h * s->blk_stride; |
974 | 150k | *mv_y += dim->h; |
975 | 9.05M | } else if (has_ver_split(pu_type)) { |
976 | 539k | *mv_pos += dim->w; |
977 | 539k | *mv_x += dim->w; |
978 | 539k | } |
979 | 9.77M | } |
980 | | |
981 | | static int mv_is_ref0(enum MVRefEnum mvref) |
982 | 478k | { |
983 | 478k | return mvref == MVREF_REF0 || mvref == MVREF_REF0ANDBREF; |
984 | 478k | } |
985 | | |
986 | | static int mv_is_forward(enum MVRefEnum mvref) |
987 | 17.6M | { |
988 | 17.6M | return mvref == MVREF_REF0 || mvref == MVREF_REF1 || mvref == MVREF_REF0ANDBREF; |
989 | 17.6M | } |
990 | | |
991 | | static int mv_is_backward(enum MVRefEnum mvref) |
992 | 18.8M | { |
993 | 18.8M | return mvref == MVREF_BREF || mvref == MVREF_REF0ANDBREF; |
994 | 18.8M | } |
995 | | |
996 | | static int mvinfo_matches_forward(const MVInfo * a, const MVInfo * b) |
997 | 1.40M | { |
998 | 1.40M | return a->mvref == b->mvref || (mv_is_ref0(a->mvref) && mv_is_ref0(b->mvref)); |
999 | 1.40M | } |
1000 | | |
1001 | | static int mvinfo_matches_backward(const MVInfo * a, const MVInfo * b) |
1002 | 778k | { |
1003 | 778k | return mv_is_backward(a->mvref) && mv_is_backward(b->mvref); |
1004 | 778k | } |
1005 | | |
1006 | | static int mvinfo_is_deblock_cand(const MVInfo * a, const MVInfo * b) |
1007 | 17.3M | { |
1008 | 17.3M | int diff; |
1009 | | |
1010 | 17.3M | if (a->mvref != b->mvref) |
1011 | 381k | return 1; |
1012 | | |
1013 | 17.0M | diff = 0; |
1014 | 17.0M | if (mv_is_forward(a->mvref)) { |
1015 | 16.9M | int dx = a->f_mv.x - b->f_mv.x; |
1016 | 16.9M | int dy = a->f_mv.y - b->f_mv.y; |
1017 | 16.9M | diff += FFABS(dx) + FFABS(dy); |
1018 | 16.9M | } |
1019 | 17.0M | if (mv_is_backward(a->mvref)) { |
1020 | 1.60M | int dx = a->b_mv.x - b->b_mv.x; |
1021 | 1.60M | int dy = a->b_mv.y - b->b_mv.y; |
1022 | 1.60M | diff += FFABS(dx) + FFABS(dy); |
1023 | 1.60M | } |
1024 | 17.0M | return diff > 4; |
1025 | 17.3M | } |
1026 | | |
1027 | | static void mv_pred(MV * ret, MV a, MV b, MV c) |
1028 | 328k | { |
1029 | 328k | #define MEDIAN(x) \ |
1030 | 656k | if (a.x < b.x) \ |
1031 | 656k | if (b.x < c.x) \ |
1032 | 313k | ret->x = b.x; \ |
1033 | 313k | else \ |
1034 | 313k | ret->x = a.x < c.x ? c.x : a.x; \ |
1035 | 656k | else \ |
1036 | 656k | if (b.x < c.x) \ |
1037 | 342k | ret->x = a.x < c.x ? a.x : c.x; \ |
1038 | 342k | else \ |
1039 | 342k | ret->x = b.x; \ |
1040 | 328k | |
1041 | 328k | MEDIAN(x) |
1042 | 328k | MEDIAN(y) |
1043 | 328k | } |
1044 | | |
1045 | | static void predict_mv(const RV60Context * s, MVInfo * dst, int mv_x, int mv_y, int mv_w, const MVInfo * src) |
1046 | 641k | { |
1047 | 641k | int mv_pos = mv_y * s->blk_stride + mv_x; |
1048 | 641k | MV f_mv, b_mv; |
1049 | | |
1050 | 641k | dst->mvref = src->mvref; |
1051 | | |
1052 | 641k | if (mv_is_forward(src->mvref)) { |
1053 | 511k | MV cand[3] = {0}; |
1054 | 511k | int cand_size = 0; |
1055 | 511k | if (mv_x > 0) { |
1056 | 482k | const MVInfo * mv = &s->blk_info[mv_pos - 1].mv; |
1057 | 482k | if (mvinfo_matches_forward(mv, src)) |
1058 | 440k | cand[cand_size++] = mv->f_mv; |
1059 | 482k | } |
1060 | 511k | if (mv_y > 0) { |
1061 | 474k | const MVInfo * mv = &s->blk_info[mv_pos - s->blk_stride].mv; |
1062 | 474k | if (mvinfo_matches_forward(mv, src)) |
1063 | 369k | cand[cand_size++] = mv->f_mv; |
1064 | 474k | } |
1065 | 511k | if (has_top_block(s, mv_x << 2, mv_y << 2, mv_w << 2, 0, 4)) { |
1066 | 448k | const MVInfo * mv = &s->blk_info[mv_pos - s->blk_stride + mv_w].mv; |
1067 | 448k | if (mvinfo_matches_forward(mv, src)) |
1068 | 275k | cand[cand_size++] = mv->f_mv; |
1069 | 448k | } |
1070 | | |
1071 | 511k | switch (cand_size) { |
1072 | 125k | case 1: |
1073 | 125k | f_mv.x = cand[0].x; |
1074 | 125k | f_mv.y = cand[0].y; |
1075 | 125k | break; |
1076 | 103k | case 2: |
1077 | 103k | f_mv.x = (cand[0].x + cand[1].x) >> 1; |
1078 | 103k | f_mv.y = (cand[0].y + cand[1].y) >> 1; |
1079 | 103k | break; |
1080 | 251k | case 3: |
1081 | 251k | mv_pred(&f_mv, cand[0], cand[1], cand[2]); |
1082 | 251k | break; |
1083 | 31.4k | default: |
1084 | 31.4k | f_mv = (MV){0,0}; |
1085 | 31.4k | break; |
1086 | 511k | } |
1087 | 511k | } else { |
1088 | 130k | f_mv = (MV){0,0}; |
1089 | 130k | } |
1090 | | |
1091 | 641k | dst->f_mv.x = src->f_mv.x + f_mv.x; |
1092 | 641k | dst->f_mv.y = src->f_mv.y + f_mv.y; |
1093 | | |
1094 | 641k | if (mv_is_backward(src->mvref)) { |
1095 | 273k | MV cand[3] = {0}; |
1096 | 273k | int cand_size = 0; |
1097 | 273k | if (mv_x > 0) { |
1098 | 271k | const MVInfo * mv = &s->blk_info[mv_pos - 1].mv; |
1099 | 271k | if (mvinfo_matches_backward(mv, src)) |
1100 | 186k | cand[cand_size++] = mv->b_mv; |
1101 | 271k | } |
1102 | 273k | if (mv_y > 0) { |
1103 | 256k | const MVInfo * mv = &s->blk_info[mv_pos - s->blk_stride].mv; |
1104 | 256k | if (mvinfo_matches_backward(mv, src)) |
1105 | 157k | cand[cand_size++] = mv->b_mv; |
1106 | 256k | } |
1107 | 273k | if (has_top_block(s, mv_x << 2, mv_y << 2, mv_w << 2, 0, 4)) { |
1108 | 251k | const MVInfo * mv = &s->blk_info[mv_pos - s->blk_stride + mv_w].mv; |
1109 | 251k | if (mvinfo_matches_backward(mv, src)) |
1110 | 105k | cand[cand_size++] = mv->b_mv; |
1111 | 251k | } |
1112 | | |
1113 | 273k | switch (cand_size) { |
1114 | 124k | case 1: |
1115 | 124k | b_mv.x = cand[0].x; |
1116 | 124k | b_mv.y = cand[0].y; |
1117 | 124k | break; |
1118 | 47.1k | case 2: |
1119 | 47.1k | b_mv.x = (cand[0].x + cand[1].x) >> 1; |
1120 | 47.1k | b_mv.y = (cand[0].y + cand[1].y) >> 1; |
1121 | 47.1k | break; |
1122 | 76.6k | case 3: |
1123 | 76.6k | mv_pred(&b_mv, cand[0], cand[1], cand[2]); |
1124 | 76.6k | break; |
1125 | 25.0k | default: |
1126 | 25.0k | b_mv = (MV){0,0}; |
1127 | 25.0k | break; |
1128 | 273k | } |
1129 | 367k | } else { |
1130 | 367k | b_mv = (MV){0,0}; |
1131 | 367k | } |
1132 | | |
1133 | 641k | dst->b_mv.x = src->b_mv.x + b_mv.x; |
1134 | 641k | dst->b_mv.y = src->b_mv.y + b_mv.y; |
1135 | 641k | } |
1136 | | |
1137 | | static void reconstruct(RV60Context * s, const CUContext * cu, int size) |
1138 | 12.1M | { |
1139 | 12.1M | int pu_size = size >> 3; |
1140 | 12.1M | PUInfo pui; |
1141 | 12.1M | int imode, mv_x, mv_y, mv_pos, count, mv_size; |
1142 | 12.1M | unique_list_mvinfo skip_cand; |
1143 | 12.1M | Dimensions dim; |
1144 | 12.1M | MVInfo mv; |
1145 | | |
1146 | 12.1M | pui.cu_type = cu->cu_type; |
1147 | 12.1M | pui.pu_type = cu->pu_type; |
1148 | | |
1149 | 12.1M | if (cu->cu_type == CU_INTRA && cu->pu_type == PU_QUARTERS) { |
1150 | 2.19M | s->pu_info[cu->pu_pos] = pui; |
1151 | 6.59M | for (int y = 0; y < 2; y++) |
1152 | 13.1M | for (int x = 0; x < 2; x++) |
1153 | 8.79M | s->blk_info[cu->blk_pos + y*s->blk_stride + x].imode = |
1154 | 8.79M | reconstruct_intra(s, cu, 4, y*2 + x); |
1155 | 2.19M | return; |
1156 | 2.19M | } |
1157 | | |
1158 | 9.93M | switch (cu->cu_type) { |
1159 | 1.16M | case CU_INTRA: |
1160 | 1.16M | imode = reconstruct_intra(s, cu, size, 0); |
1161 | 11.7M | for (int y = 0; y < size >> 2; y++) |
1162 | 144M | for (int x = 0; x < size >> 2; x++) |
1163 | 133M | s->blk_info[cu->blk_pos + y*s->blk_stride + x].imode = imode; |
1164 | 1.16M | break; |
1165 | 253k | case CU_INTER_MV: |
1166 | 253k | mv_x = cu->xpos >> 2; |
1167 | 253k | mv_y = cu->ypos >> 2; |
1168 | 253k | mv_pos = cu->blk_pos; |
1169 | 253k | count = pu_type_num_parts(cu->pu_type); |
1170 | 895k | for (int part_no = 0; part_no < count; part_no++) { |
1171 | 641k | MVInfo mv; |
1172 | 641k | get_mv_dimensions(&dim, cu->pu_type, part_no, size); |
1173 | 641k | predict_mv(s, &mv, mv_x, mv_y, dim.w, &cu->mv[part_no]); |
1174 | 4.93M | for (int y = 0; y < dim.h; y++) |
1175 | 33.8M | for (int x = 0; x < dim.w; x++) |
1176 | 29.5M | s->blk_info[mv_pos + y*s->blk_stride + x].mv = mv; |
1177 | 641k | get_next_mv(s, &dim, cu->pu_type, part_no, &mv_pos, &mv_x, &mv_y); |
1178 | 641k | } |
1179 | 253k | break; |
1180 | 8.51M | default: |
1181 | 8.51M | unique_list_mvinfo_init(&skip_cand); |
1182 | 8.51M | fill_mv_skip_cand(s, cu, &skip_cand, size); |
1183 | 8.51M | mv = skip_cand.list[get_skip_mv_index(cu->mv[0].mvref)]; |
1184 | 8.51M | mv_size = size >> 2; |
1185 | 25.8M | for (int y = 0; y < mv_size; y++) |
1186 | 56.4M | for (int x = 0; x < mv_size; x++) |
1187 | 39.0M | s->blk_info[cu->blk_pos + y*s->blk_stride + x].mv = mv; |
1188 | 9.93M | } |
1189 | | |
1190 | 25.0M | for (int y = 0; y < pu_size; y++) |
1191 | 65.7M | for (int x = 0; x < pu_size; x++) |
1192 | 50.6M | s->pu_info[cu->pu_pos + y*s->pu_stride + x] = pui; |
1193 | 9.93M | } |
1194 | | |
1195 | | static void read_mv(GetBitContext * gb, MV * mv) |
1196 | 784k | { |
1197 | 784k | mv->x = get_interleaved_se_golomb(gb); |
1198 | 784k | mv->y = get_interleaved_se_golomb(gb); |
1199 | 784k | } |
1200 | | |
1201 | | static void read_mv_info(RV60Context *s, GetBitContext * gb, MVInfo * mvinfo, int size, enum PUType pu_type) |
1202 | 641k | { |
1203 | 641k | if (s->pict_type != AV_PICTURE_TYPE_B) { |
1204 | 279k | if (s->two_f_refs && get_bits1(gb)) |
1205 | 13.5k | mvinfo->mvref = MVREF_REF1; |
1206 | 266k | else |
1207 | 266k | mvinfo->mvref = MVREF_REF0; |
1208 | 279k | read_mv(gb, &mvinfo->f_mv); |
1209 | 279k | mvinfo->b_mv.x = mvinfo->b_mv.y = 0; |
1210 | 361k | } else { |
1211 | 361k | if ((size <= 8 && (size != 8 || pu_type != PU_FULL)) || get_bits1(gb)) { |
1212 | 218k | if (!get_bits1(gb)) { |
1213 | 87.9k | mvinfo->mvref = MVREF_REF0; |
1214 | 87.9k | read_mv(gb, &mvinfo->f_mv); |
1215 | 87.9k | mvinfo->b_mv.x = mvinfo->b_mv.y = 0; |
1216 | 130k | } else { |
1217 | 130k | mvinfo->mvref = MVREF_BREF; |
1218 | 130k | mvinfo->f_mv.x = mvinfo->f_mv.y = 0; |
1219 | 130k | read_mv(gb, &mvinfo->b_mv); |
1220 | 130k | } |
1221 | 218k | } else { |
1222 | 143k | mvinfo->mvref = MVREF_REF0ANDBREF; |
1223 | 143k | read_mv(gb, &mvinfo->f_mv); |
1224 | 143k | read_mv(gb, &mvinfo->b_mv); |
1225 | 143k | } |
1226 | 361k | } |
1227 | 641k | } |
1228 | | |
/**
 * 6-tap interpolation filter with taps (1, -5, 52, 20, -5, 1), rounded and
 * divided by 64.
 *
 * The sample position is taken from variables named x and y that must be in
 * scope where the macro is expanded. step is the distance between taps
 * (1 for a horizontal filter, the stride for a vertical one). Every argument
 * and the whole expansion are parenthesised so that the macro behaves as a
 * single expression whatever is passed in and whatever surrounds it.
 */
#define FILTER1(src, src_stride, src_y_ofs, step) \
    ((      (src)[(y + (src_y_ofs))*(src_stride) + x - 2*(step)] \
     - 5 * (src)[(y + (src_y_ofs))*(src_stride) + x - 1*(step)] \
     +52 * (src)[(y + (src_y_ofs))*(src_stride) + x           ] \
     +20 * (src)[(y + (src_y_ofs))*(src_stride) + x + 1*(step)] \
     - 5 * (src)[(y + (src_y_ofs))*(src_stride) + x + 2*(step)] \
     +     (src)[(y + (src_y_ofs))*(src_stride) + x + 3*(step)] + 32) >> 6)
1236 | | |
/**
 * 6-tap interpolation filter with taps (1, -5, 20, 20, -5, 1), rounded and
 * divided by 32.
 *
 * The sample position is taken from variables named x and y that must be in
 * scope where the macro is expanded. step is the distance between taps
 * (1 for a horizontal filter, the stride for a vertical one). Every argument
 * and the whole expansion are parenthesised so that the macro behaves as a
 * single expression whatever is passed in and whatever surrounds it.
 */
#define FILTER2(src, src_stride, src_y_ofs, step) \
    ((      (src)[(y + (src_y_ofs))*(src_stride) + x - 2*(step)] \
     - 5 * (src)[(y + (src_y_ofs))*(src_stride) + x - 1*(step)] \
     +20 * (src)[(y + (src_y_ofs))*(src_stride) + x           ] \
     +20 * (src)[(y + (src_y_ofs))*(src_stride) + x + 1*(step)] \
     - 5 * (src)[(y + (src_y_ofs))*(src_stride) + x + 2*(step)] \
     +     (src)[(y + (src_y_ofs))*(src_stride) + x + 3*(step)] + 16) >> 5)
1244 | | |
/**
 * 6-tap interpolation filter with taps (1, -5, 20, 52, -5, 1), rounded and
 * divided by 64.
 *
 * The sample position is taken from variables named x and y that must be in
 * scope where the macro is expanded. step is the distance between taps
 * (1 for a horizontal filter, the stride for a vertical one). Every argument
 * and the whole expansion are parenthesised so that the macro behaves as a
 * single expression whatever is passed in and whatever surrounds it.
 */
#define FILTER3(src, src_stride, src_y_ofs, step) \
    ((      (src)[(y + (src_y_ofs))*(src_stride) + x - 2*(step)] \
     - 5 * (src)[(y + (src_y_ofs))*(src_stride) + x - 1*(step)] \
     +20 * (src)[(y + (src_y_ofs))*(src_stride) + x           ] \
     +52 * (src)[(y + (src_y_ofs))*(src_stride) + x + 1*(step)] \
     - 5 * (src)[(y + (src_y_ofs))*(src_stride) + x + 2*(step)] \
     +     (src)[(y + (src_y_ofs))*(src_stride) + x + 3*(step)] + 32) >> 6)
1252 | | |
/**
 * One case of the FILTER_BLOCK switch: evaluate the expression `filter` for
 * every position of a w x h block and store the result, clipped to 8 bits,
 * in dst. The loops declare the x and y variables that the FILTERn macros
 * refer to. w, h and dst_stride are parenthesised so that compound
 * arguments such as `h + 5` are always evaluated as a unit.
 */
#define FILTER_CASE(idx, dst, dst_stride, filter, w, h) \
    case idx: \
        for (int y = 0; y < (h); y++) \
            for (int x = 0; x < (w); x++) \
                (dst)[y*(dst_stride) + x] = av_clip_uint8(filter); \
        break;

/**
 * Filter a w x h block from src into dst with FILTER1, FILTER2 or FILTER3,
 * selected by cond being 1, 2 or 3; any other value does nothing.
 * This expands to a complete switch statement and is written without a
 * trailing semicolon at the call sites.
 */
#define FILTER_BLOCK(dst, dst_stride, src, src_stride, src_y_ofs, w, h, cond, step) \
    switch (cond) { \
    FILTER_CASE(1, dst, dst_stride, FILTER1(src, src_stride, src_y_ofs, step), w, h) \
    FILTER_CASE(2, dst, dst_stride, FILTER2(src, src_stride, src_y_ofs, step), w, h) \
    FILTER_CASE(3, dst, dst_stride, FILTER3(src, src_stride, src_y_ofs, step), w, h) \
    }
1266 | | |
1267 | | static void luma_mc(uint8_t * dst, int dst_stride, const uint8_t * src, int src_stride, int w, int h, int cx, int cy) |
1268 | 9.27M | { |
1269 | 9.27M | if (!cx && !cy) { |
1270 | 82.2M | for (int y = 0; y < h; y++) |
1271 | 73.5M | memcpy(dst + y*dst_stride, src + y*src_stride, w); |
1272 | 8.64M | } else if (!cy) { |
1273 | 81.8k | FILTER_BLOCK(dst, dst_stride, src, src_stride, 0, w, h, cx, 1) |
1274 | 544k | } else if (!cx) { |
1275 | 54.2k | FILTER_BLOCK(dst, dst_stride, src, src_stride, 0, w, h, cy, src_stride) |
1276 | 490k | } else if (cx != 3 || cy != 3) { |
1277 | 372k | uint8_t tmp[70 * 64]; |
1278 | 372k | FILTER_BLOCK(tmp, 64, src - src_stride * 2, src_stride, 0, w, h + 5, cx, 1) |
1279 | 372k | FILTER_BLOCK(dst, dst_stride, tmp + 2*64, 64, 0, w, h, cy, 64) |
1280 | 372k | } else { |
1281 | 4.84M | for (int j = 0; j < h; j++) |
1282 | 138M | for (int i = 0; i < w; i++) |
1283 | 133M | dst[j*dst_stride + i] = ( |
1284 | 133M | src[j*src_stride + i] + |
1285 | 133M | src[j*src_stride + i + 1] + |
1286 | 133M | src[(j + 1)*src_stride + i] + |
1287 | 133M | src[(j + 1)*src_stride + i + 1] + 2) >> 2; |
1288 | 117k | } |
1289 | 9.27M | } |
1290 | | |
/**
 * Interpolate a w x h chroma block with quarter-sample bilinear weights.
 *
 * @param dst        output block
 * @param dst_stride distance between output rows
 * @param src        reference samples; one extra column and/or row is read
 *                   when the matching fraction is non-zero
 * @param src_stride distance between reference rows
 * @param w          block width
 * @param h          block height
 * @param x          horizontal fraction in quarter samples
 * @param y          vertical fraction in quarter samples
 */
static void chroma_mc(uint8_t * dst, int dst_stride, const uint8_t * src, int src_stride, int w, int h, int x, int y)
{
    if (!x && !y) {
        /* integer position: plain copy */
        for (int row = 0; row < h; row++)
            memcpy(dst + row*dst_stride, src + row*src_stride, w);
        return;
    }

    if (x > 0 && y > 0) {
        int wt_tl, wt_tr, wt_bl, wt_br;

        if (x == 3 && y == 3)
            y = 2; //reproduce bug in rv60 decoder. tested with realplayer version 18.1.7.344 and 22.0.0.321

        wt_tl = (4 - x) * (4 - y);
        wt_tr = x * (4 - y);
        wt_bl = (4 - x) * y;
        wt_br = x * y;
        for (int row = 0; row < h; row++) {
            const uint8_t * cur  = src + row*src_stride;
            const uint8_t * next = src + (row + 1)*src_stride;
            for (int col = 0; col < w; col++)
                dst[row*dst_stride + col] =
                    (wt_tl * cur[col] + wt_tr * cur[col + 1] +
                     wt_bl * next[col] + wt_br * next[col + 1] + 8) >> 4;
        }
        return;
    }

    {
        /* only one direction is fractional: two-tap blend along it */
        const int wt_here  = (4 - x) * (4 - y);
        const int wt_there = x * (4 - y) + (4 - x) * y;
        const int step     = y > 0 ? src_stride : 1;

        for (int row = 0; row < h; row++) {
            const uint8_t * cur = src + row*src_stride;
            for (int col = 0; col < w; col++)
                dst[row*dst_stride + col] =
                    (wt_here * cur[col] + wt_there * cur[col + step] + 8) >> 4;
        }
    }
}
1324 | | |
/**
 * Test whether a displaced block, enlarged by per-side margins, lies
 * completely inside a w x h plane.
 *
 * @param x,y    block position
 * @param cw,ch  block size
 * @param w,h    plane size
 * @param dx,dy  displacement added to the position
 * @param e0,e1  margins required to the left and right of the block
 * @param e2,e3  margins required above and below the block
 * @return 1 when block plus margins fit, 0 otherwise
 */
static int check_pos(int x, int y, int cw, int ch, int w, int h, int dx, int dy, int e0, int e1, int e2, int e3)
{
    const int left   = x + dx;
    const int top    = y + dy;

    if (left - e0 < 0)
        return 0;
    if (left + cw + e1 > w)
        return 0;
    if (top - e2 < 0)
        return 0;
    if (top + ch + e3 > h)
        return 0;
    return 1;
}
1331 | | |
1332 | | static void mc(RV60Context * s, uint8_t * frame_data[3], int frame_linesize[3], const AVFrame * ref, int x, int y, int w, int h, MV mv, int avg) |
1333 | 9.27M | { |
1334 | 9.27M | { |
1335 | 9.27M | int off = !avg ? y * frame_linesize[0] + x : 0; |
1336 | 9.27M | int fw = s->awidth; |
1337 | 9.27M | int fh = s->aheight; |
1338 | 9.27M | int dx = mv.x >> 2; |
1339 | 9.27M | int cx = mv.x & 3; |
1340 | 9.27M | int dy = mv.y >> 2; |
1341 | 9.27M | int cy = mv.y & 3; |
1342 | | |
1343 | 9.27M | if (check_pos(x, y, w, h, fw, fh, dx, dy, rv60_edge1[cx], rv60_edge2[cx], rv60_edge1[cy], rv60_edge2[cy])) { |
1344 | 9.05M | luma_mc( |
1345 | 9.05M | frame_data[0] + off, |
1346 | 9.05M | frame_linesize[0], |
1347 | 9.05M | ref->data[0] + (y + dy) * ref->linesize[0] + x + dx, |
1348 | 9.05M | ref->linesize[0], |
1349 | 9.05M | w, h, cx, cy); |
1350 | 9.05M | } else { |
1351 | 223k | uint8_t buf[70*70]; |
1352 | 223k | int xoff = x + dx - 2; |
1353 | 223k | int yoff = y + dy - 2; |
1354 | 223k | s->vdsp.emulated_edge_mc(buf, |
1355 | 223k | ref->data[0] + yoff * ref->linesize[0] + xoff, |
1356 | 223k | 70, ref->linesize[0], |
1357 | 223k | w + 5, h + 5, |
1358 | 223k | xoff, yoff, |
1359 | 223k | fw, fh); |
1360 | | |
1361 | 223k | luma_mc(frame_data[0] + off, frame_linesize[0], |
1362 | 223k | buf + 70 * 2 + 2, 70, w, h, cx, cy); |
1363 | 223k | } |
1364 | 9.27M | } |
1365 | 9.27M | { |
1366 | 9.27M | int fw = s->awidth >> 1; |
1367 | 9.27M | int fh = s->aheight >> 1; |
1368 | 9.27M | int mvx = mv.x / 2; |
1369 | 9.27M | int mvy = mv.y / 2; |
1370 | 9.27M | int dx = mvx >> 2; |
1371 | 9.27M | int cx = mvx & 3; |
1372 | 9.27M | int dy = mvy >> 2; |
1373 | 9.27M | int cy = mvy & 3; |
1374 | 9.27M | int cw = w >> 1; |
1375 | 9.27M | int ch = h >> 1; |
1376 | | |
1377 | 27.8M | for (int plane = 1; plane < 3; plane++) { |
1378 | 18.5M | int off = !avg ? (y >> 1) * frame_linesize[plane] + (x >> 1) : 0; |
1379 | 18.5M | if (check_pos(x >> 1, y >> 1, cw, ch, fw, fh, dx, dy, 0, 1, 0, 1)) { |
1380 | 17.7M | chroma_mc( |
1381 | 17.7M | frame_data[plane] + off, |
1382 | 17.7M | frame_linesize[plane], |
1383 | 17.7M | ref->data[plane] + ((y >> 1) + dy) * ref->linesize[plane] + (x >> 1) + dx, |
1384 | 17.7M | ref->linesize[plane], |
1385 | 17.7M | cw, ch, cx, cy); |
1386 | 17.7M | } else { |
1387 | 762k | uint8_t buf[40*40]; |
1388 | 762k | s->vdsp.emulated_edge_mc(buf, |
1389 | 762k | ref->data[plane] + ((y >> 1) + dy) * ref->linesize[plane] + (x >> 1) + dx, |
1390 | 762k | 40, ref->linesize[plane], |
1391 | 762k | cw + 1, ch + 1, |
1392 | 762k | (x >> 1) + dx, (y >> 1) + dy, |
1393 | 762k | fw, fh); |
1394 | 762k | chroma_mc(frame_data[plane] + off, frame_linesize[plane], buf, 40, cw, ch, cx, cy); |
1395 | 762k | } |
1396 | 18.5M | } |
1397 | 9.27M | } |
1398 | 9.27M | } |
1399 | | |
/**
 * Average a w x h block of src into dst in place: every dst sample becomes
 * (dst + src) >> 1, i.e. the mean rounded down.
 */
static void avg_plane(uint8_t * dst, int dst_stride, const uint8_t * src, int src_stride, int w, int h)
{
    for (int row = 0; row < h; row++) {
        uint8_t * out      = dst + row*dst_stride;
        const uint8_t * in = src + row*src_stride;

        for (int col = 0; col < w; col++) {
            const int sum = out[col] + in[col];
            out[col] = sum >> 1;
        }
    }
}
1406 | | |
1407 | | static void avg(AVFrame * frame, uint8_t * prev_frame_data[3], int prev_frame_linesize[3], int x, int y, int w, int h) |
1408 | 146k | { |
1409 | 587k | for (int plane = 0; plane < 3; plane++) { |
1410 | 440k | int shift = !plane ? 0 : 1; |
1411 | 440k | avg_plane(frame->data[plane] + (y >> shift) * frame->linesize[plane] + (x >> shift), frame->linesize[plane], |
1412 | 440k | prev_frame_data[plane], prev_frame_linesize[plane], |
1413 | 440k | w >> shift, h >> shift); |
1414 | 440k | } |
1415 | 146k | } |
1416 | | |
1417 | | static int get_c4x4_set(int qp, int is_intra) |
1418 | 8.36M | { |
1419 | 8.36M | if (is_intra) |
1420 | 3.04M | return rv60_qp_to_idx[qp + 32]; |
1421 | 5.32M | else |
1422 | 5.32M | return rv60_qp_to_idx[qp]; |
1423 | 8.36M | } |
1424 | | |
/**
 * Scale a decoded coefficient level: (v * q + 8) >> 4.
 */
static int quant(int v, int q)
{
    const int scaled = v * q;

    return (scaled + 8) >> 4;
}
1429 | | |
1430 | | static int decode_coeff(GetBitContext * gb, const CoeffVLCs * vlcs, int inval, int val) |
1431 | 257M | { |
1432 | 257M | int esc_sym; |
1433 | | |
1434 | 257M | if (inval != val) |
1435 | 176M | return inval && get_bits1(gb) ? -inval : inval; |
1436 | | |
1437 | 81.3M | esc_sym = get_vlc2(gb, vlcs->esc, 9, 2); |
1438 | 81.3M | if (esc_sym > 23) { |
1439 | 53.6M | int esc_bits = esc_sym - 23; |
1440 | 53.6M | val += (1 << esc_bits) + get_bits(gb, esc_bits) + 22; |
1441 | 53.6M | } else |
1442 | 27.7M | val += esc_sym; |
1443 | | |
1444 | 81.3M | return get_bits1(gb) ? -val : val; |
1445 | 257M | } |
1446 | | |
1447 | | static void decode_2x2_dc(GetBitContext * gb, const CoeffVLCs * vlcs, int16_t * coeffs, int stride, int block2, int dsc, int q_dc, int q_ac) |
1448 | 8.36M | { |
1449 | 8.36M | const uint8_t * lx; |
1450 | 8.36M | if (!dsc) |
1451 | 0 | return; |
1452 | | |
1453 | 8.36M | lx = rv60_dsc_to_lx[dsc - 1]; |
1454 | | |
1455 | 8.36M | coeffs[0] = quant(decode_coeff(gb, vlcs, lx[0], 3), q_dc); |
1456 | 8.36M | if (!block2) { |
1457 | 8.36M | coeffs[1] = quant(decode_coeff(gb, vlcs, lx[1], 2), q_ac); |
1458 | 8.36M | coeffs[stride] = quant(decode_coeff(gb, vlcs, lx[2], 2), q_ac); |
1459 | 8.36M | } else { |
1460 | 0 | coeffs[stride] = quant(decode_coeff(gb, vlcs, lx[1], 2), q_ac); |
1461 | 0 | coeffs[1] = quant(decode_coeff(gb, vlcs, lx[2], 2), q_ac); |
1462 | 0 | } |
1463 | 8.36M | coeffs[stride + 1] = quant(decode_coeff(gb, vlcs, lx[3], 2), q_ac); |
1464 | 8.36M | } |
1465 | | |
1466 | | static void decode_2x2(GetBitContext * gb, const CoeffVLCs * vlcs, int16_t * coeffs, int stride, int block2, int dsc, int q_ac) |
1467 | 56.1M | { |
1468 | 56.1M | const uint8_t * lx; |
1469 | 56.1M | if (!dsc) |
1470 | 0 | return; |
1471 | | |
1472 | 56.1M | lx = rv60_dsc_to_lx[dsc - 1]; |
1473 | | |
1474 | 56.1M | coeffs[0] = quant(decode_coeff(gb, vlcs, lx[0], 3), q_ac); |
1475 | 56.1M | if (!block2) { |
1476 | 44.1M | coeffs[1] = quant(decode_coeff(gb, vlcs, lx[1], 2), q_ac); |
1477 | 44.1M | coeffs[stride] = quant(decode_coeff(gb, vlcs, lx[2], 2), q_ac); |
1478 | 44.1M | } else { |
1479 | 11.9M | coeffs[stride] = quant(decode_coeff(gb, vlcs, lx[1], 2), q_ac); |
1480 | 11.9M | coeffs[1] = quant(decode_coeff(gb, vlcs, lx[2], 2), q_ac); |
1481 | 11.9M | } |
1482 | 56.1M | coeffs[stride + 1] = quant(decode_coeff(gb, vlcs, lx[3], 2), q_ac); |
1483 | 56.1M | } |
1484 | | |
1485 | | static void decode_4x4_block_dc(GetBitContext * gb, const CoeffVLCs * vlcs, int is_luma, int16_t * coeffs, int stride, int q_dc, int q_ac) |
1486 | 8.64M | { |
1487 | 8.64M | int sym0 = get_vlc2(gb, vlcs->l0[!is_luma], 9, 2); |
1488 | 8.64M | int grp0 = sym0 >> 3; |
1489 | | |
1490 | 8.64M | if (grp0) |
1491 | 8.36M | decode_2x2_dc(gb, vlcs, coeffs, stride, 0, grp0, q_dc, q_ac); |
1492 | | |
1493 | 8.64M | if (sym0 & 4) { |
1494 | 4.25M | int grp = get_vlc2(gb, vlcs->l12[!is_luma], 9, 2); |
1495 | 4.25M | decode_2x2(gb, vlcs, coeffs + 2, stride, 0, grp, q_ac); |
1496 | 4.25M | } |
1497 | 8.64M | if (sym0 & 2) { |
1498 | 2.60M | int grp = get_vlc2(gb, vlcs->l12[!is_luma], 9, 2); |
1499 | 2.60M | decode_2x2(gb, vlcs, coeffs + 2*stride, stride, 1, grp, q_ac); |
1500 | 2.60M | } |
1501 | 8.64M | if (sym0 & 1) { |
1502 | 4.97M | int grp = get_vlc2(gb, vlcs->l3[!is_luma], 9, 2); |
1503 | 4.97M | decode_2x2(gb, vlcs, coeffs + 2*stride + 2, stride, 0, grp, q_ac); |
1504 | 4.97M | } |
1505 | 8.64M | } |
1506 | | |
1507 | | static void decode_4x4_block(GetBitContext * gb, const CoeffVLCs * vlcs, int is_luma, int16_t * coeffs, int stride, int q_ac) |
1508 | 20.0M | { |
1509 | 20.0M | int sym0 = get_vlc2(gb, vlcs->l0[!is_luma], 9, 2); |
1510 | 20.0M | int grp0 = (sym0 >> 3); |
1511 | | |
1512 | 20.0M | if (grp0) |
1513 | 18.5M | decode_2x2(gb, vlcs, coeffs, stride, 0, grp0, q_ac); |
1514 | | |
1515 | 20.0M | if (sym0 & 4) { |
1516 | 7.24M | int grp = get_vlc2(gb, vlcs->l12[!is_luma], 9, 2); |
1517 | 7.24M | decode_2x2(gb, vlcs, coeffs + 2, stride, 0, grp, q_ac); |
1518 | 7.24M | } |
1519 | 20.0M | if (sym0 & 2) { |
1520 | 9.36M | int grp = get_vlc2(gb, vlcs->l12[!is_luma], 9, 2); |
1521 | 9.36M | decode_2x2(gb, vlcs, coeffs + 2*stride, stride, 1, grp, q_ac); |
1522 | 9.36M | } |
1523 | 20.0M | if (sym0 & 1) { |
1524 | 9.16M | int grp = get_vlc2(gb, vlcs->l3[!is_luma], 9, 2); |
1525 | 9.16M | decode_2x2(gb, vlcs, coeffs + 2*stride + 2, stride, 0, grp, q_ac); |
1526 | 9.16M | } |
1527 | 20.0M | } |
1528 | | |
1529 | | static void decode_cu_4x4in16x16(GetBitContext * gb, int is_intra, int qp, int sel_qp, int16_t * y_coeffs, int16_t * u_coeffs, int16_t * v_coeffs, int cbp) |
1530 | 2.91k | { |
1531 | 2.91k | int cb_set = get_c4x4_set(sel_qp, is_intra); |
1532 | 2.91k | const CoeffVLCs * vlc = is_intra ? &intra_coeff_vlc[cb_set] : &inter_coeff_vlc[cb_set]; |
1533 | 2.91k | int q_y = rv60_quants_b[qp]; |
1534 | 2.91k | int q_c_dc = rv60_quants_b[rv60_chroma_quant_dc[qp]]; |
1535 | 2.91k | int q_c_ac = rv60_quants_b[rv60_chroma_quant_ac[qp]]; |
1536 | | |
1537 | 2.91k | memset(y_coeffs, 0, sizeof(y_coeffs[0])*256); |
1538 | 49.5k | for (int i = 0; i < 16; i++) |
1539 | 46.6k | if ((cbp >> i) & 1) |
1540 | 21.2k | decode_4x4_block(gb, vlc, 1, y_coeffs + i * 16 , 4, q_y); |
1541 | | |
1542 | 2.91k | memset(u_coeffs, 0, sizeof(u_coeffs[0])*64); |
1543 | 14.5k | for (int i = 0; i < 4; i++) |
1544 | 11.6k | if ((cbp >> (16 + i)) & 1) |
1545 | 2.15k | decode_4x4_block_dc(gb, vlc, 0, u_coeffs + i * 16, 4, q_c_dc, q_c_ac); |
1546 | | |
1547 | 2.91k | memset(v_coeffs, 0, sizeof(v_coeffs[0])*64); |
1548 | 14.5k | for (int i = 0; i < 4; i++) |
1549 | 11.6k | if ((cbp >> (20 + i)) & 1) |
1550 | 1.18k | decode_4x4_block_dc(gb, vlc, 0, v_coeffs + i * 16, 4, q_c_dc, q_c_ac); |
1551 | 2.91k | } |
1552 | | |
1553 | | static int decode_cbp8(GetBitContext * gb, int subset, int qp) |
1554 | 6.83M | { |
1555 | 6.83M | int cb_set = rv60_qp_to_idx[qp]; |
1556 | 6.83M | return get_vlc2(gb, cbp8_vlc[cb_set][subset], 9, 2); |
1557 | 6.83M | } |
1558 | | |
1559 | | static void decode_cu_8x8(GetBitContext * gb, int is_intra, int qp, int sel_qp, int16_t * y_coeffs, int16_t * u_coeffs, int16_t * v_coeffs, int ccbp, int mode4x4) |
1560 | 6.66M | { |
1561 | 6.66M | int cb_set = get_c4x4_set(sel_qp, is_intra); |
1562 | 6.66M | const CoeffVLCs * vlc = is_intra ? &intra_coeff_vlc[cb_set] : &inter_coeff_vlc[cb_set]; |
1563 | 6.66M | int q_y = rv60_quants_b[qp]; |
1564 | 6.66M | int q_c_dc = rv60_quants_b[rv60_chroma_quant_dc[qp]]; |
1565 | 6.66M | int q_c_ac = rv60_quants_b[rv60_chroma_quant_ac[qp]]; |
1566 | | |
1567 | 6.66M | memset(y_coeffs, 0, sizeof(y_coeffs[0])*64); |
1568 | 33.3M | for (int i = 0; i < 4; i++) { |
1569 | 26.6M | if ((ccbp >> i) & 1) { |
1570 | 13.9M | int offset, stride; |
1571 | 13.9M | if (mode4x4) { |
1572 | 4.42M | offset = i*16; |
1573 | 4.42M | stride = 4; |
1574 | 9.54M | } else { |
1575 | 9.54M | offset = (i & 1) * 4 + (i & 2) * 2 * 8; |
1576 | 9.54M | stride = 8; |
1577 | 9.54M | } |
1578 | 13.9M | decode_4x4_block(gb, vlc, 1, y_coeffs + offset, stride, q_y); |
1579 | 13.9M | } |
1580 | 26.6M | } |
1581 | | |
1582 | 6.66M | if ((ccbp >> 4) & 1) { |
1583 | 3.74M | memset(u_coeffs, 0, sizeof(u_coeffs[0])*16); |
1584 | 3.74M | decode_4x4_block_dc(gb, vlc, 0, u_coeffs, 4, q_c_dc, q_c_ac); |
1585 | 3.74M | } |
1586 | | |
1587 | 6.66M | if ((ccbp >> 5) & 1) { |
1588 | 3.74M | memset(v_coeffs, 0, sizeof(u_coeffs[0])*16); |
1589 | 3.74M | decode_4x4_block_dc(gb, vlc, 0, v_coeffs, 4, q_c_dc, q_c_ac); |
1590 | 3.74M | } |
1591 | 6.66M | } |
1592 | | |
1593 | | static void decode_cu_16x16(GetBitContext * gb, int is_intra, int qp, int sel_qp, int16_t * y_coeffs, int16_t * u_coeffs, int16_t * v_coeffs, int ccbp) |
1594 | 1.69M | { |
1595 | 1.69M | int cb_set = get_c4x4_set(sel_qp, is_intra); |
1596 | 1.69M | const CoeffVLCs * vlc = is_intra ? &intra_coeff_vlc[cb_set] : &inter_coeff_vlc[cb_set]; |
1597 | 1.69M | int q_y = rv60_quants_b[qp]; |
1598 | 1.69M | int q_c_dc = rv60_quants_b[rv60_chroma_quant_dc[qp]]; |
1599 | 1.69M | int q_c_ac = rv60_quants_b[rv60_chroma_quant_ac[qp]]; |
1600 | | |
1601 | 1.69M | memset(y_coeffs, 0, sizeof(y_coeffs[0])*256); |
1602 | 28.7M | for (int i = 0; i < 16; i++) |
1603 | 27.0M | if ((ccbp >> i) & 1) { |
1604 | 5.83M | int off = (i & 3) * 4 + (i >> 2) * 4 * 16; |
1605 | 5.83M | decode_4x4_block(gb, vlc, 1, y_coeffs + off, 16, q_y); |
1606 | 5.83M | } |
1607 | | |
1608 | 1.69M | memset(u_coeffs, 0, sizeof(u_coeffs[0])*64); |
1609 | 8.46M | for (int i = 0; i < 4; i++) |
1610 | 6.77M | if ((ccbp >> (16 + i)) & 1) { |
1611 | 805k | int off = (i & 1) * 4 + (i & 2) * 2 * 8; |
1612 | 805k | if (!i) |
1613 | 677k | decode_4x4_block_dc(gb, vlc, 0, u_coeffs + off, 8, q_c_dc, q_c_ac); |
1614 | 127k | else |
1615 | 127k | decode_4x4_block(gb, vlc, 0, u_coeffs + off, 8, q_c_ac); |
1616 | 805k | } |
1617 | | |
1618 | 1.69M | memset(v_coeffs, 0, sizeof(v_coeffs[0])*64); |
1619 | 8.46M | for (int i = 0; i < 4; i++) |
1620 | 6.77M | if ((ccbp >> (20 + i)) & 1) { |
1621 | 572k | int off = (i & 1) * 4 + (i & 2) * 2 * 8; |
1622 | 572k | if (!i) |
1623 | 473k | decode_4x4_block_dc(gb, vlc, 0, v_coeffs + off, 8, q_c_dc, q_c_ac); |
1624 | 99.5k | else |
1625 | 99.5k | decode_4x4_block(gb, vlc, 0, v_coeffs + off, 8, q_c_ac); |
1626 | 572k | } |
1627 | 1.69M | } |
1628 | | |
1629 | | static int decode_super_cbp(GetBitContext * gb, const VLCElem * vlc[4]) |
1630 | 1.69M | { |
1631 | 1.69M | int sym0 = get_vlc2(gb, vlc[0], 9, 2); |
1632 | 1.69M | int sym1 = get_vlc2(gb, vlc[1], 9, 2); |
1633 | 1.69M | int sym2 = get_vlc2(gb, vlc[2], 9, 2); |
1634 | 1.69M | int sym3 = get_vlc2(gb, vlc[3], 9, 2); |
1635 | 1.69M | return 0 |
1636 | 1.69M | + ((sym0 & 0x03) << 0) |
1637 | 1.69M | + ((sym0 & 0x0C) << 2) |
1638 | 1.69M | + ((sym0 & 0x10) << 12) |
1639 | 1.69M | + ((sym0 & 0x20) << 15) |
1640 | 1.69M | + ((sym1 & 0x03) << 2) |
1641 | 1.69M | + ((sym1 & 0x0C) << 4) |
1642 | 1.69M | + ((sym1 & 0x10) << 13) |
1643 | 1.69M | + ((sym1 & 0x20) << 16) |
1644 | 1.69M | + ((sym2 & 0x03) << 8) |
1645 | 1.69M | + ((sym2 & 0x0C) << 10) |
1646 | 1.69M | + ((sym2 & 0x10) << 14) |
1647 | 1.69M | + ((sym2 & 0x20) << 17) |
1648 | 1.69M | + ((sym3 & 0x03) << 10) |
1649 | 1.69M | + ((sym3 & 0x0C) << 12) |
1650 | 1.69M | + ((sym3 & 0x10) << 15) |
1651 | 1.69M | + ((sym3 & 0x20) << 18); |
1652 | 1.69M | } |
1653 | | |
1654 | | static int decode_cbp16(GetBitContext * gb, int subset, int qp) |
1655 | 1.69M | { |
1656 | 1.69M | int cb_set = rv60_qp_to_idx[qp]; |
1657 | 1.69M | return decode_super_cbp(gb, cbp16_vlc[cb_set][subset]); |
1658 | 1.69M | } |
1659 | | |
/**
 * Recursively decode the coding unit (CU) of size 1 << log_size whose
 * top-left corner is at (xpos, ypos).
 *
 * A CU that starts outside awidth x aheight is ignored. A CU that crosses the
 * right or bottom limit is split without reading a bit; otherwise CUs larger
 * than 8 read a one-bit split flag. Every split decision is appended to
 * thread->cu_split. For a leaf CU the function reads the CU type and
 * prediction data, calls reconstruct(), writes the intra prediction or the
 * motion-compensated prediction into frame, and finally decodes the residual
 * and adds it to frame according to the selected transform type.
 *
 * @param qp     quantiser index passed to the coefficient decoders
 * @param sel_qp quantiser index passed to the CBP/VLC selection
 * @return 0 on success; a negative error code when a sub-CU fails,
 *         pred_angle() fails, a needed reference picture has no data,
 *         or qp >= 32
 */
1660 | | static int decode_cu_r(RV60Context * s, AVFrame * frame, ThreadContext * thread, GetBitContext * gb, int xpos, int ypos, int log_size, int qp, int sel_qp) |
1661 | 17.0M | { |
1662 | 17.0M | int size = 1 << log_size; |
1663 | 17.0M | int split, ret, ttype, count, is_intra, cu_pos, subset, cbp8, imode, split_i4x4, num_clusters, cl_cbp, super_cbp, mv_x, mv_y, mv_pos; |
1664 | 17.0M | int16_t y_coeffs[16*16], u_coeffs[8*8], v_coeffs[8*8]; |
1665 | 17.0M | CUContext cu; |
1666 | | |
/* CU starts at or beyond awidth/aheight: nothing to decode, no bits consumed. */
1667 | 17.0M | if (xpos >= s->awidth || ypos >= s->aheight) |
1668 | 738k | return 0; |
1669 | | |
/* Crossing the right/bottom limit forces a split; the short-circuit || keeps
 * get_bits1() from being called in that case. Size 8 CUs never read the flag. */
1670 | 16.3M | split = xpos + size > s->awidth || ypos + size > s->aheight || (size > 8 && get_bits1(gb)); |
/* Remember the decision; deblock_cu_r() reads the same list back in the same order. */
1671 | 16.3M | thread->cu_split[thread->cu_split_pos++] = split; |
1672 | 16.3M | if (split) { |
1673 | 4.17M | size >>= 1; |
1674 | 4.17M | log_size -= 1; |
/* Quadrant order: top-left, top-right, bottom-left, bottom-right; stop at the first error. */
1675 | 4.17M | if ((ret = decode_cu_r(s, frame, thread, gb, xpos, ypos, log_size, qp, sel_qp)) < 0 || |
1676 | 3.95M | (ret = decode_cu_r(s, frame, thread, gb, xpos + size, ypos, log_size, qp, sel_qp)) < 0 || |
1677 | 3.95M | (ret = decode_cu_r(s, frame, thread, gb, xpos, ypos + size, log_size, qp, sel_qp)) < 0 || |
1678 | 3.95M | (ret = decode_cu_r(s, frame, thread, gb, xpos + size, ypos + size, log_size, qp, sel_qp)) < 0) |
1679 | 224k | return ret; |
1680 | 3.94M | return 0; |
1681 | 4.17M | } |
1682 | | |
/* Leaf CU. pu_pos addresses 8x8 units, blk_pos addresses 4x4 units. */
1683 | 12.1M | cu.xpos = xpos; |
1684 | 12.1M | cu.ypos = ypos; |
1685 | 12.1M | cu.pu_pos = (xpos >> 3) + (ypos >> 3) * s->pu_stride; |
1686 | 12.1M | cu.blk_pos = (xpos >> 2) + (ypos >> 2) * s->blk_stride; |
/* I-pictures carry no CU type bits: every CU is intra. */
1687 | 12.1M | cu.cu_type = s->pict_type != AV_PICTURE_TYPE_I ? get_bits(gb, 2) : CU_INTRA; |
1688 | | |
/* Read the prediction side information for this CU type. */
1689 | 12.1M | switch (cu.cu_type) { |
1690 | 3.36M | case CU_INTRA: |
/* Only 8x8 CUs may be split into four separately predicted quarters. */
1691 | 3.36M | cu.pu_type = size == 8 && get_bits1(gb) ? PU_QUARTERS : PU_FULL; |
1692 | 3.36M | if (cu.pu_type == PU_QUARTERS) |
1693 | 10.9M | for (int i = 0; i < 4; i++) |
1694 | 8.79M | cu.imode[i] = read_intra_mode(gb, &cu.imode_param[i]); |
1695 | 1.16M | else if (size <= 32) |
1696 | 722k | cu.imode[0] = read_intra_mode(gb, &cu.imode_param[0]); |
1697 | 439k | else |
/* 64x64 intra CUs choose between two dedicated modes with a single bit. */
1698 | 439k | cu.imode[0] = get_bits1(gb) ? INTRAMODE_PLANE64 : INTRAMODE_DC64; |
1699 | 3.36M | break; |
1700 | 253k | case CU_INTER_MV: |
/* The partition type uses 2 bits for 8x8 CUs and 3 bits otherwise. */
1701 | 253k | cu.pu_type = get_bits(gb, size == 8 ? 2 : 3); |
1702 | 253k | count = pu_type_num_parts(cu.pu_type); |
1703 | 895k | for (int i = 0; i < count; i++) |
1704 | 641k | read_mv_info(s, gb, &cu.mv[i], size, cu.pu_type); |
1705 | 253k | break; |
1706 | 8.51M | default: |
/* Remaining CU types (CU_SKIP, CU_INTER): one partition, reference chosen by a unary code of at most 3 bits. */
1707 | 8.51M | cu.pu_type = PU_FULL; |
1708 | 8.51M | cu.mv[0].mvref = skip_mv_ref[get_unary(gb, 0, 3)]; |
1709 | 8.51M | break; |
1710 | 12.1M | } |
1711 | | |
1712 | 12.1M | reconstruct(s, &cu, size); |
1713 | | |
/* True when luma intra prediction must be done per 4x4 sub-block (handled in the TRANSFORM_4X4 path below). */
1714 | 12.1M | split_i4x4 = cu.cu_type == CU_INTRA && size == 8 && cu.pu_type == PU_QUARTERS; |
1715 | | |
/* Write the prediction into the frame. */
1716 | 12.1M | switch (cu.cu_type) { |
1717 | 3.36M | case CU_INTRA: |
1718 | 3.36M | imode = s->blk_info[cu.blk_pos].imode; |
/* Whole-CU luma prediction; skipped when the CU is split into 4x4 quarters. */
1719 | 3.36M | if (!split_i4x4) { |
1720 | 1.16M | int off = ypos * frame->linesize[0] + xpos; |
1721 | 1.16M | populate_ipred(s, &cu, frame->data[0], frame->linesize[0], 0, 0, size, 1); |
1722 | 1.16M | if (pred_angle(&cu.ipred, frame->data[0] + off, frame->linesize[0], size, imode, 1) < 0) |
1723 | 0 | return AVERROR_INVALIDDATA; |
1724 | 1.16M | } |
/* Both chroma planes are predicted at half the luma size and position, using the same imode. */
1725 | 10.0M | for (int plane = 1; plane < 3; plane++) { |
1726 | 6.72M | int off = (ypos >> 1) * frame->linesize[plane] + (xpos >> 1); |
1727 | 6.72M | populate_ipred(s, &cu, frame->data[plane], frame->linesize[plane], 0, 0, size >> 1, 0); |
1728 | 6.72M | if (pred_angle(&cu.ipred, frame->data[plane] + off, frame->linesize[plane], size >> 1, imode, 0) < 0) |
1729 | 0 | return AVERROR_INVALIDDATA; |
1730 | 6.72M | } |
1731 | 3.36M | break; |
1732 | 8.76M | default: |
/* Inter prediction: walk the partitions; mv_x/mv_y/mv_pos are in 4x4-block units. */
1733 | 8.76M | mv_x = xpos >> 2; |
1734 | 8.76M | mv_y = ypos >> 2; |
1735 | 8.76M | mv_pos = mv_y * s->blk_stride + mv_x; |
1736 | 8.76M | count = pu_type_num_parts(cu.pu_type); |
1737 | 17.8M | for (int part_no = 0; part_no < count; part_no++) { |
1738 | 9.14M | MVInfo mv; |
1739 | 9.14M | Dimensions dim; |
1740 | 9.14M | int bw, bh, bx, by; |
1741 | | |
1742 | 9.14M | mv = s->blk_info[mv_pos].mv; |
1743 | 9.14M | get_mv_dimensions(&dim, cu.pu_type, part_no, size); |
/* Convert the partition size and position from 4x4-block units to pixels. */
1744 | 9.14M | bw = dim.w << 2; |
1745 | 9.14M | bh = dim.h << 2; |
1746 | 9.14M | bx = mv_x << 2; |
1747 | 9.14M | by = mv_y << 2; |
1748 | | |
/* Reject the CU if a reference picture selected by mvref holds no data. */
1749 | 9.14M | if (!(mv.mvref & 2)) { |
1750 | 8.97M | if (!s->last_frame[LAST_PIC]->data[0]) { |
1751 | 13.8k | av_log(s->avctx, AV_LOG_ERROR, "missing reference frame\n"); |
1752 | 13.8k | return AVERROR_INVALIDDATA; |
1753 | 13.8k | } |
1754 | 8.97M | } |
1755 | 9.13M | if (mv.mvref & 6) { |
1756 | 314k | if (!s->last_frame[NEXT_PIC]->data[0]) { |
1757 | 4.59k | av_log(s->avctx, AV_LOG_ERROR, "missing reference frame\n"); |
1758 | 4.59k | return AVERROR_INVALIDDATA; |
1759 | 4.59k | } |
1760 | 314k | } |
1761 | | |
1762 | 9.12M | switch (mv.mvref) { |
1763 | 8.81M | case MVREF_REF0: |
1764 | 8.81M | mc(s, frame->data, frame->linesize, s->last_frame[LAST_PIC], bx, by, bw, bh, mv.f_mv, 0); |
1765 | 8.81M | break; |
1766 | 6.72k | case MVREF_REF1: |
1767 | 6.72k | mc(s, frame->data, frame->linesize, s->last_frame[NEXT_PIC], bx, by, bw, bh, mv.f_mv, 0); |
1768 | 6.72k | break; |
1769 | 156k | case MVREF_BREF: |
1770 | 156k | mc(s, frame->data, frame->linesize, s->last_frame[NEXT_PIC], bx, by, bw, bh, mv.b_mv, 0); |
1771 | 156k | break; |
1772 | 146k | case MVREF_REF0ANDBREF: |
/* Bi-prediction: forward prediction goes to the frame, backward prediction to the scratch buffer, then avg() combines them. */
1773 | 146k | mc(s, frame->data, frame->linesize, s->last_frame[LAST_PIC], bx, by, bw, bh, mv.f_mv, 0); |
1774 | 146k | mc(s, thread->avg_data, thread->avg_linesize, s->last_frame[NEXT_PIC], bx, by, bw, bh, mv.b_mv, 1); |
1775 | 146k | avg(frame, thread->avg_data, thread->avg_linesize, bx, by, bw, bh); |
1776 | 146k | break; |
1777 | 0 | default: |
1778 | 0 | av_assert0(0); //should never reach here |
1779 | 9.12M | } |
1780 | 9.12M | get_next_mv(s, &dim, cu.pu_type, part_no, &mv_pos, &mv_x, &mv_y); |
1781 | 9.12M | } |
1782 | 8.75M | break; |
1783 | 12.1M | } |
1784 | | |
/* Choose the residual transform: none for skipped CUs, 16x16 clusters for
 * sizes >= 32, and for smaller CUs the large transform only when the CU is
 * intra (size 16) or unpartitioned. */
1785 | 12.1M | if (cu.cu_type == CU_SKIP) |
1786 | 3.98M | ttype = TRANSFORM_NONE; |
1787 | 8.12M | else if (size >= 32) |
1788 | 811k | ttype = TRANSFORM_16X16; |
1789 | 7.31M | else if (size == 16) |
1790 | 417k | ttype = cu.cu_type == CU_INTRA || cu.pu_type == PU_FULL ? TRANSFORM_16X16 : TRANSFORM_4X4; |
1791 | 6.89M | else |
1792 | 6.89M | ttype = cu.pu_type == PU_FULL ? TRANSFORM_8X8 : TRANSFORM_4X4; |
1793 | | |
1794 | 12.1M | is_intra = cu.cu_type == CU_INTRA; |
/* NOTE(review): qp is rejected here, after prediction has already been written; presumably the quantiser tables indexed by qp have 32 entries - confirm. */
1795 | 12.1M | if (qp >= 32) |
1796 | 72.1k | return AVERROR_INVALIDDATA; |
/* Index of this CU's first 8x8 cell in the 8-wide coded_blk grid of the enclosing 64x64 area. */
1797 | 12.0M | cu_pos = ((xpos & 63) >> 3) + ((ypos & 63) >> 3) * 8; |
1798 | | |
1799 | 12.0M | switch (ttype) { |
1800 | 2.23M | case TRANSFORM_4X4: |
1801 | 2.23M | subset = is_intra ? 0 : 2; |
1802 | 2.23M | if (size == 16) { |
/* A one-bit flag says whether any residual is coded for this 16x16 CU. */
1803 | 28.8k | int cbp16 = get_bits1(gb) ? decode_cbp16(gb, subset, sel_qp) : 0; |
1804 | 28.8k | if (cbp16) { |
1805 | 2.91k | decode_cu_4x4in16x16(gb, is_intra, qp, sel_qp, y_coeffs, u_coeffs, v_coeffs, cbp16); |
/* Luma: 4x4 grid of 4x4 blocks; each coded block marks its enclosing 8x8 cell. */
1806 | 14.5k | for (int y = 0; y < 4; y++) |
1807 | 58.3k | for (int x = 0; x < 4; x++) { |
1808 | 46.6k | int i = y*4 + x; |
1809 | 46.6k | if ((cbp16 >> i) & 1) { |
1810 | 21.2k | int off = (ypos + y * 4)*frame->linesize[0] + xpos + x * 4; |
1811 | 21.2k | ff_rv60_idct4x4_add(y_coeffs + i*16, frame->data[0] + off, frame->linesize[0]); |
1812 | 21.2k | thread->coded_blk[cu_pos + (y/2)*8 + (x/2)] = 1; |
1813 | 21.2k | } |
1814 | 46.6k | } |
/* Chroma: 2x2 grid of 4x4 blocks per plane, U flags in bits 16-19 and V flags in bits 20-23. */
1815 | 8.74k | for (int y = 0; y < 2; y++) |
1816 | 17.4k | for (int x = 0; x < 2; x++) { |
1817 | 11.6k | int i = y * 2 + x; |
1818 | 11.6k | int xoff = (xpos >> 1) + x * 4; |
1819 | 11.6k | int yoff = (ypos >> 1) + y * 4; |
1820 | 11.6k | if ((cbp16 >> (16 + i)) & 1) { |
1821 | 2.15k | int off = yoff * frame->linesize[1] + xoff; |
1822 | 2.15k | ff_rv60_idct4x4_add(u_coeffs + i * 16, frame->data[1] + off, frame->linesize[1]); |
1823 | 2.15k | thread->coded_blk[cu_pos + y*8 + x] = 1; |
1824 | 2.15k | } |
1825 | 11.6k | if ((cbp16 >> (20 + i)) & 1) { |
1826 | 1.18k | int off = yoff * frame->linesize[2] + xoff; |
1827 | 1.18k | ff_rv60_idct4x4_add(v_coeffs + i * 16, frame->data[2] + off, frame->linesize[2]); |
1828 | 1.18k | thread->coded_blk[cu_pos + y*8 + x] = 1; |
1829 | 1.18k | } |
1830 | 11.6k | } |
1831 | 2.91k | } |
1832 | 2.20M | } else { |
1833 | 2.20M | cbp8 = decode_cbp8(gb, subset, sel_qp); |
1834 | 2.20M | if (cbp8) { |
1835 | 2.11M | thread->coded_blk[cu_pos] = 1; |
1836 | 2.11M | decode_cu_8x8(gb, is_intra, qp, sel_qp, y_coeffs, u_coeffs, v_coeffs, cbp8, 1); |
1837 | 2.11M | } |
/* Per 4x4 luma quarter: predict first (when the intra CU is split), then add the residual, so later quarters see reconstructed neighbours. */
1838 | 11.0M | for (int i = 0; i < 4; i++) { |
1839 | 8.83M | int xoff = (i & 1) << 2; |
1840 | 8.83M | int yoff = (i & 2) << 1; |
1841 | 8.83M | if (split_i4x4) { |
1842 | 8.54M | int off = (ypos + yoff) * frame->linesize[0] + xpos + xoff; |
1843 | 8.54M | int imode = s->blk_info[cu.blk_pos + (i >> 1) * s->blk_stride + (i & 1)].imode; |
1844 | 8.54M | populate_ipred(s, &cu, frame->data[0], frame->linesize[0], xoff, yoff, 4, 1); |
1845 | 8.54M | if (pred_angle(&cu.ipred, frame->data[0] + off, frame->linesize[0], 4, imode, 1) < 0) |
1846 | 0 | return AVERROR_INVALIDDATA; |
1847 | 8.54M | } |
1848 | 8.83M | if ((cbp8 >> i) & 1) { |
1849 | 4.42M | int off = (ypos + yoff) * frame->linesize[0] + xpos + xoff; |
1850 | 4.42M | ff_rv60_idct4x4_add(y_coeffs + i * 16, frame->data[0] + off, frame->linesize[0]); |
1851 | 4.42M | } |
1852 | 8.83M | } |
1853 | 2.20M | if ((cbp8 >> 4) & 1) { |
1854 | 1.53M | int off = (ypos >> 1) * frame->linesize[1] + (xpos >> 1); |
1855 | 1.53M | ff_rv60_idct4x4_add(u_coeffs, frame->data[1] + off, frame->linesize[1]); |
1856 | 1.53M | } |
1857 | 2.20M | if ((cbp8 >> 5) & 1) { |
1858 | 1.54M | int off = (ypos >> 1) * frame->linesize[2] + (xpos >> 1); |
1859 | 1.54M | ff_rv60_idct4x4_add(v_coeffs, frame->data[2] + off, frame->linesize[2]); |
1860 | 1.54M | } |
1861 | 2.20M | } |
1862 | 2.23M | break; |
1863 | 4.62M | case TRANSFORM_8X8: |
1864 | 4.62M | subset = is_intra ? 1 : 3; |
1865 | 4.62M | cbp8 = decode_cbp8(gb, subset, sel_qp); |
1866 | 4.62M | if (cbp8) { |
1867 | 4.55M | thread->coded_blk[cu_pos] = 1; |
1868 | 4.55M | decode_cu_8x8(gb, is_intra, qp, sel_qp, y_coeffs, u_coeffs, v_coeffs, cbp8, 0); |
/* One 8x8 luma transform if any of the four luma bits is set; chroma uses a 4x4 transform per plane. */
1869 | 4.55M | if (cbp8 & 0xF) { |
1870 | 4.52M | int off = ypos * frame->linesize[0] + xpos; |
1871 | 4.52M | ff_rv60_idct8x8_add(y_coeffs, frame->data[0] + off, frame->linesize[0]); |
1872 | 4.52M | } |
1873 | 4.55M | if ((cbp8 >> 4) & 1) { |
1874 | 2.20M | int off = (ypos >> 1) * frame->linesize[1] + (xpos >> 1); |
1875 | 2.20M | ff_rv60_idct4x4_add(u_coeffs, frame->data[1] + off, frame->linesize[1]); |
1876 | 2.20M | } |
1877 | 4.55M | if ((cbp8 >> 5) & 1) { |
1878 | 2.20M | int off = (ypos >> 1) * frame->linesize[2] + (xpos >> 1); |
1879 | 2.20M | ff_rv60_idct4x4_add(v_coeffs, frame->data[2] + off, frame->linesize[2]); |
1880 | 2.20M | } |
1881 | 4.55M | } |
1882 | 4.62M | break; |
1883 | 1.19M | case TRANSFORM_16X16: |
1884 | 1.19M | subset = is_intra ? 1 : 3; |
/* The CU is a num_clusters x num_clusters grid of 16x16 clusters; cl_cbp carries one "coded" bit per cluster. */
1885 | 1.19M | num_clusters = size >> 4; |
1886 | 1.19M | cl_cbp = get_bits(gb, num_clusters * num_clusters); |
1887 | 4.26M | for (int y = 0; y < num_clusters; y++) { |
1888 | 13.1M | for (int x = 0; x < num_clusters; x++) { |
1889 | 10.0M | if (!((cl_cbp >> (y*num_clusters + x)) & 1)) |
1890 | 8.38M | continue; |
/* A coded cluster marks all four of its 8x8 cells, before its own pattern is read. */
1891 | 1.69M | thread->coded_blk[cu_pos + y*2*8 + x*2 + 0] = 1; |
1892 | 1.69M | thread->coded_blk[cu_pos + y*2*8 + x*2 + 1] = 1; |
1893 | 1.69M | thread->coded_blk[cu_pos + y*2*8 + x*2 + 8] = 1; |
1894 | 1.69M | thread->coded_blk[cu_pos + y*2*8 + x*2 + 9] = 1; |
1895 | 1.69M | super_cbp = decode_cbp16(gb, subset, sel_qp); |
1896 | 1.69M | if (super_cbp) { |
1897 | 1.69M | decode_cu_16x16(gb, is_intra, qp, sel_qp, y_coeffs, u_coeffs, v_coeffs, super_cbp); |
/* Luma uses one 16x16 transform (bits 0-15); each chroma plane one 8x8 transform (bits 16-19 for U, 20-23 for V). */
1898 | 1.69M | if (super_cbp & 0xFFFF) { |
1899 | 1.69M | int off = (ypos + y * 16) * frame->linesize[0] + xpos + x * 16; |
1900 | 1.69M | ff_rv60_idct16x16_add(y_coeffs, frame->data[0] + off, frame->linesize[0]); |
1901 | 1.69M | } |
1902 | 1.69M | if ((super_cbp >> 16) & 0xF) { |
1903 | 702k | int off = ((ypos >> 1) + y * 8) * frame->linesize[1] + (xpos >> 1) + x * 8; |
1904 | 702k | ff_rv60_idct8x8_add(u_coeffs, frame->data[1] + off, frame->linesize[1]); |
1905 | 702k | } |
1906 | 1.69M | if ((super_cbp >> 20) & 0xF) { |
1907 | 496k | int off = ((ypos >> 1) + y * 8) * frame->linesize[2] + (xpos >> 1) + x * 8; |
1908 | 496k | ff_rv60_idct8x8_add(v_coeffs, frame->data[2] + off, frame->linesize[2]); |
1909 | 496k | } |
1910 | 1.69M | } |
1911 | 1.69M | } |
1912 | 3.07M | } |
1913 | 1.19M | break; |
1914 | 12.0M | } |
1915 | | |
1916 | 12.0M | return 0; |
1917 | 12.0M | } |
1918 | | |
1919 | | static int deblock_get_pos(RV60Context * s, int xpos, int ypos) |
1920 | 36.3M | { |
1921 | 36.3M | return (ypos >> 2) * s->dblk_stride + (xpos >> 2); |
1922 | 36.3M | } |
1923 | | |
1924 | | static void deblock_set_strength(RV60Context * s, int xpos, int ypos, int size, int q, int strength) |
1925 | 15.9M | { |
1926 | 15.9M | int pos = deblock_get_pos(s, xpos, ypos); |
1927 | 15.9M | int dsize = size >> 2; |
1928 | 15.9M | int dval = (q << 2) + strength; |
1929 | | |
1930 | 64.5M | for (int x = 0; x < dsize; x++) { |
1931 | 48.5M | s->top_str[pos + x] = dval; |
1932 | 48.5M | s->top_str[pos + (dsize - 1)*s->dblk_stride + x] = dval; |
1933 | 48.5M | } |
1934 | | |
1935 | 64.5M | for (int y = 0; y < dsize; y++) { |
1936 | 48.5M | s->left_str[pos + y*s->dblk_stride] = dval; |
1937 | 48.5M | s->left_str[pos + y*s->dblk_stride + dsize - 1] = dval; |
1938 | 48.5M | } |
1939 | 15.9M | } |
1940 | | |
1941 | | static int deblock_get_top_strength(const RV60Context * s, int pos) |
1942 | 10.4M | { |
1943 | 10.4M | return s->top_str[pos] & 3; |
1944 | 10.4M | } |
1945 | | |
1946 | | static int deblock_get_left_strength(const RV60Context * s, int pos) |
1947 | 10.8M | { |
1948 | 10.8M | return s->left_str[pos] & 3; |
1949 | 10.8M | } |
1950 | | |
1951 | | static void deblock_set_top_strength(RV60Context * s, int pos, int strength) |
1952 | 700k | { |
1953 | 700k | s->top_str[pos] |= strength; |
1954 | 700k | } |
1955 | | |
1956 | | static void deblock_set_left_strength(RV60Context * s, int pos, int strength) |
1957 | 611k | { |
1958 | 611k | s->left_str[pos] |= strength; |
1959 | 611k | } |
1960 | | |
1961 | | static void derive_deblock_strength(RV60Context * s, int xpos, int ypos, int size) |
1962 | 4.42M | { |
1963 | 4.42M | int blk_pos = (ypos >> 2) * s->blk_stride + (xpos >> 2); |
1964 | 4.42M | int dblk_pos = deblock_get_pos(s, xpos, ypos); |
1965 | 4.42M | if (ypos > 0) |
1966 | 14.7M | for (int i = 0; i < size; i++) |
1967 | 10.4M | if (!deblock_get_top_strength(s, dblk_pos - s->dblk_stride + i) && mvinfo_is_deblock_cand(&s->blk_info[blk_pos + i].mv, &s->blk_info[blk_pos - s->blk_stride + i].mv)) |
1968 | 700k | deblock_set_top_strength(s, dblk_pos + i, 1); |
1969 | 4.42M | if (xpos > 0) |
1970 | 15.1M | for (int i = 0; i < size; i++) |
1971 | 10.8M | if (!deblock_get_left_strength(s, dblk_pos + i *s->dblk_stride - 1) && mvinfo_is_deblock_cand(&s->blk_info[blk_pos + i*s->blk_stride].mv, &s->blk_info[blk_pos + i*s->blk_stride - 1].mv)) |
1972 | 611k | deblock_set_left_strength(s, dblk_pos + i *s->dblk_stride, 1); |
1973 | 4.42M | } |
1974 | | |
/* Classify a gradient: 3 when |el| is below lim, otherwise 1. el is expanded inside FFABS(), so it must be free of side effects. */
1975 | 221M | #define STRENGTH(el, lim) (FFABS(el) < (lim) ? 3 : 1) |
/* Clip a to the symmetric range [-b, b] via av_clip(); b appears twice in the expansion. */
1976 | 134M | #define CLIP_SYMM(a, b) av_clip(a, -(b), b) |
1977 | | |
/**
 * Deblock four luma lines across one edge.
 *
 * @param dst    first sample on the near side of the edge; samples at
 *               dst[-step], dst[-2*step], dst[-3*step] lie on the far side
 * @param step   distance between samples across the edge
 * @param stride distance between successive lines along the edge
 * @param mode1  clip limit for the correction of dst[-2*step]
 * @param mode2  clip limit for the correction of dst[step]
 * @param lim1   multiplier used when deciding whether a line is filtered
 * @param lim2   gradient threshold used to grade each side of the edge
 *
 * Each side is graded 3 (smooth) or 1 from the sum of its four inner
 * gradients. Nothing is done when both sides grade 1; when exactly one
 * does, the weak filter with halved clip limits is used.
 */
static void filter_luma_edge(uint8_t * dst, int step, int stride, int mode1, int mode2, int lim1, int lim2)
{
    int16_t diff_q1q0[4];
    int16_t diff_p1p0[4];
    int sum_q = 0, sum_p = 0;
    int str_p, str_q, msum, maxprod, weak;

    for (int i = 0; i < 4; i++) {
        const uint8_t * line = dst + i * stride;

        diff_q1q0[i] = line[-2*step] - line[-step];
        diff_p1p0[i] = line[step] - line[0];
        sum_q += diff_q1q0[i];
        sum_p += diff_p1p0[i];
    }

    str_p = STRENGTH(sum_q, lim2);
    str_q = STRENGTH(sum_p, lim2);

    if (str_p + str_q <= 2)
        return;

    msum    = (mode1 + mode2 + str_q + str_p) >> 1;
    weak    = str_q == 1 || str_p == 1;
    maxprod = weak ? 384 : 256;

    for (int y = 0; y < 4; y++, dst += stride) {
        const int diff_p0q0 = dst[0] - dst[-step];
        int diff_q1q2, diff_p1p2, delta;

        /* skip flat edges and steps too large to be a coding artefact */
        if (!diff_p0q0 || ((lim1 * FFABS(diff_p0q0)) & -128) > maxprod)
            continue;

        /* outer gradients are sampled before any sample is modified */
        diff_q1q2 = dst[-2*step] - dst[-3*step];
        diff_p1p2 = dst[step] - dst[2*step];

        if (weak) {
            delta = CLIP_SYMM((diff_p0q0 + 1) >> 1, msum >> 1);
        } else {
            int diff_strg = (dst[-2*step] - dst[step] + 4 * diff_p0q0 + 4) >> 3;
            delta = CLIP_SYMM(diff_strg, msum);
        }

        dst[-step] = av_clip_uint8(dst[-step] + delta);
        dst[0]     = av_clip_uint8(dst[0] - delta);

        if (str_p != 1 && FFABS(diff_q1q2) <= (lim2 >> 2)) {
            int diff = (diff_q1q0[y] + diff_q1q2 - delta) >> 1;
            int delta_q1;

            if (weak)
                delta_q1 = CLIP_SYMM(diff, mode1 >> 1);
            else
                delta_q1 = CLIP_SYMM(diff, mode1);
            dst[-2*step] = av_clip_uint8(dst[-2*step] - delta_q1);
        }

        if (str_q != 1 && FFABS(diff_p1p2) <= (lim2 >> 2)) {
            int diff = (diff_p1p0[y] + diff_p1p2 + delta) >> 1;
            int delta_p1;

            if (weak)
                delta_p1 = CLIP_SYMM(diff, mode2 >> 1);
            else
                delta_p1 = CLIP_SYMM(diff, mode2);
            dst[step] = av_clip_uint8(dst[step] - delta_p1);
        }
    }
}
2033 | | |
/**
 * Deblock two chroma lines across one edge.
 *
 * Parameters have the same meaning as for filter_luma_edge(). Each side is
 * graded from a single gradient (scaled by 4) on the first line, and only
 * the two samples adjacent to the edge are modified.
 */
static void filter_chroma_edge(uint8_t * dst, int step, int stride, int mode1, int mode2, int lim1, int lim2)
{
    const int grad_q = 4 * FFABS(dst[-2*step] - dst[-step]);
    const int grad_p = 4 * FFABS(dst[ step] - dst[0]);
    const int str_q  = STRENGTH(grad_q, lim2);
    const int str_p  = STRENGTH(grad_p, lim2);
    int msum, maxprod, weak;

    if (str_p + str_q <= 2)
        return;

    msum    = (mode1 + mode2 + str_q + str_p) >> 1;
    weak    = str_q == 1 || str_p == 1;
    maxprod = weak ? 384 : 256;

    for (int y = 0; y < 2; y++, dst += stride) {
        const int diff_pq = dst[0] - dst[-step];
        int delta;

        if (!diff_pq || ((lim1 * FFABS(diff_pq)) & -128) > maxprod)
            continue;

        if (weak) {
            delta = CLIP_SYMM((diff_pq + 1) >> 1, msum >> 1);
        } else {
            int diff_strg = (dst[-2*step] - dst[step] + 4 * diff_pq + 4) >> 3;
            delta = CLIP_SYMM(diff_strg, msum);
        }

        dst[-step] = av_clip_uint8(dst[-step] + delta);
        dst[ 0 ]   = av_clip_uint8(dst[ 0 ] - delta);
    }
}
2071 | | |
2072 | | static void deblock_edge_ver(AVFrame * frame, int xpos, int ypos, int dblk_l, int dblk_r, int deblock_chroma) |
2073 | 40.0M | { |
2074 | 40.0M | int qp_l = dblk_l >> 2; |
2075 | 40.0M | int str_l = dblk_l & 3; |
2076 | 40.0M | int qp_r = dblk_r >> 2; |
2077 | 40.0M | int str_r = dblk_r & 3; |
2078 | 40.0M | const uint8_t * dl_l = rv60_deblock_limits[qp_l]; |
2079 | 40.0M | const uint8_t * dl_r = rv60_deblock_limits[qp_r]; |
2080 | 40.0M | int mode_l = str_l ? dl_l[str_l - 1] : 0; |
2081 | 40.0M | int mode_r = str_r ? dl_r[str_r - 1] : 0; |
2082 | 40.0M | int lim1 = dl_r[2]; |
2083 | 40.0M | int lim2 = dl_r[3] * 4; |
2084 | | |
2085 | 40.0M | filter_luma_edge(frame->data[0] + ypos * frame->linesize[0] + xpos, 1, frame->linesize[0], mode_l, mode_r, lim1, lim2); |
2086 | 40.0M | if ((str_l | str_r) >= 2 && deblock_chroma) |
2087 | 27.3M | for (int plane = 1; plane < 3; plane++) |
2088 | 18.2M | filter_chroma_edge(frame->data[plane] + (ypos >> 1) * frame->linesize[plane] + (xpos >> 1), 1, frame->linesize[plane], mode_l, mode_r, lim1, lim2); |
2089 | 40.0M | } |
2090 | | |
2091 | | static void deblock_edge_hor(AVFrame * frame, int xpos, int ypos, int dblk_t, int dblk_d, int deblock_chroma) |
2092 | 34.4M | { |
2093 | 34.4M | int qp_t = dblk_t >> 2; |
2094 | 34.4M | int str_t = dblk_t & 3; |
2095 | 34.4M | int qp_d = dblk_d >> 2; |
2096 | 34.4M | int str_d = dblk_d & 3; |
2097 | 34.4M | const uint8_t * dl_t = rv60_deblock_limits[qp_t]; |
2098 | 34.4M | const uint8_t * dl_d = rv60_deblock_limits[qp_d]; |
2099 | 34.4M | int mode_t = str_t ? dl_t[str_t - 1] : 0; |
2100 | 34.4M | int mode_d = str_d ? dl_d[str_d - 1] : 0; |
2101 | 34.4M | int lim1 = dl_d[2]; |
2102 | 34.4M | int lim2 = dl_d[3] * 4; |
2103 | | |
2104 | 34.4M | filter_luma_edge(frame->data[0] + ypos * frame->linesize[0] + xpos, frame->linesize[0], 1, mode_t, mode_d, lim1, lim2); |
2105 | 34.4M | if ((str_t | str_d) >= 2 && deblock_chroma) |
2106 | 26.7M | for (int plane = 1; plane < 3; plane++) |
2107 | 17.8M | filter_chroma_edge(frame->data[plane] + (ypos >> 1) * frame->linesize[plane] + (xpos >> 1), frame->linesize[plane], 1, mode_t, mode_d, lim1, lim2); |
2108 | 34.4M | } |
2109 | | |
2110 | | static void deblock8x8(const RV60Context * s, AVFrame * frame, int xpos, int ypos, int dblkpos) |
2111 | 32.6M | { |
2112 | 32.6M | if (xpos > 0) { |
2113 | 32.4M | if (ypos > 0) { |
2114 | 29.4M | int str_l = s->left_str[dblkpos - s->dblk_stride - 1]; |
2115 | 29.4M | int str_r = s->left_str[dblkpos - s->dblk_stride]; |
2116 | 29.4M | if ((str_l | str_r) & 3) |
2117 | 18.4M | deblock_edge_ver(frame, xpos, ypos - 4, str_l, str_r, s->deblock_chroma); |
2118 | 29.4M | } |
2119 | 32.4M | { |
2120 | 32.4M | int str_l = s->left_str[dblkpos - 1]; |
2121 | 32.4M | int str_r = s->left_str[dblkpos]; |
2122 | 32.4M | if ((str_l | str_r) & 3) |
2123 | 20.0M | deblock_edge_ver(frame, xpos, ypos, str_l, str_r, s->deblock_chroma); |
2124 | 32.4M | } |
2125 | 32.4M | if (ypos + 8 >= s->aheight) { |
2126 | 1.58M | int str_l = s->left_str[dblkpos + s->dblk_stride - 1]; |
2127 | 1.58M | int str_r = s->left_str[dblkpos + s->dblk_stride]; |
2128 | 1.58M | if ((str_l | str_r) & 3) |
2129 | 1.53M | deblock_edge_ver(frame, xpos, ypos + 4, str_l, str_r, s->deblock_chroma); |
2130 | 1.58M | } |
2131 | 32.4M | } |
2132 | 32.6M | if (ypos > 0) { |
2133 | 29.6M | if (xpos > 0) { |
2134 | 29.4M | int str_t = s->top_str[dblkpos - s->dblk_stride - 1]; |
2135 | 29.4M | int str_d = s->top_str[dblkpos - 1]; |
2136 | 29.4M | if ((str_t | str_d) & 3) |
2137 | 17.1M | deblock_edge_hor(frame, xpos - 4, ypos, str_t, str_d, s->deblock_chroma); |
2138 | 29.4M | } |
2139 | 29.6M | { |
2140 | 29.6M | int str_t = s->top_str[dblkpos - s->dblk_stride]; |
2141 | 29.6M | int str_d = s->top_str[dblkpos]; |
2142 | 29.6M | if ((str_t | str_d) & 3) |
2143 | 17.2M | deblock_edge_hor(frame, xpos, ypos, str_t, str_d, s->deblock_chroma); |
2144 | 29.6M | } |
2145 | 29.6M | if (xpos + 8 >= s->awidth) { |
2146 | 110k | int str_t = s->top_str[dblkpos - s->dblk_stride + 1]; |
2147 | 110k | int str_d = s->top_str[dblkpos + 1]; |
2148 | 110k | if ((str_t | str_d) & 3) |
2149 | 89.5k | deblock_edge_hor(frame, xpos + 4, ypos, str_t, str_d, s->deblock_chroma); |
2150 | 110k | } |
2151 | 29.6M | } |
2152 | 32.6M | } |
2153 | | |
2154 | | static void deblock(const RV60Context * s, AVFrame * frame, int xpos, int ypos, int size, int dpos) |
2155 | 15.9M | { |
2156 | 40.2M | for (int x = 0; x < size >> 3; x++) |
2157 | 24.2M | deblock8x8(s, frame, xpos + x * 8, ypos, dpos + x * 2); |
2158 | | |
2159 | 24.2M | for (int y = 1; y < size >> 3; y++) |
2160 | 8.34M | deblock8x8(s, frame, xpos, ypos + y * 8, dpos + y * 2 * s->dblk_stride); |
2161 | 15.9M | } |
2162 | | |
2163 | | static void deblock_cu_r(RV60Context * s, AVFrame * frame, ThreadContext * thread, int xpos, int ypos, int log_size, int qp) |
2164 | 11.5M | { |
2165 | 11.5M | int pu_pos, tsize, ntiles; |
2166 | 11.5M | enum CUType cu_type; |
2167 | | |
2168 | 11.5M | if (xpos >= s->awidth || ypos >= s->aheight) |
2169 | 423k | return; |
2170 | | |
2171 | 11.1M | if (thread->cu_split[thread->cu_split_pos++]) { |
2172 | 2.71M | int hsize = 1 << (log_size - 1); |
2173 | 2.71M | log_size--; |
2174 | 2.71M | deblock_cu_r(s, frame, thread, xpos, ypos, log_size, qp); |
2175 | 2.71M | deblock_cu_r(s, frame, thread, xpos + hsize, ypos, log_size, qp); |
2176 | 2.71M | deblock_cu_r(s, frame, thread, xpos, ypos + hsize, log_size, qp); |
2177 | 2.71M | deblock_cu_r(s, frame, thread, xpos + hsize, ypos + hsize, log_size, qp); |
2178 | 2.71M | return; |
2179 | 2.71M | } |
2180 | | |
2181 | 8.42M | pu_pos = (ypos >> 3) * s->pu_stride + (xpos >> 3); |
2182 | 8.42M | cu_type = s->pu_info[pu_pos].cu_type; |
2183 | 8.42M | switch (log_size) { |
2184 | 7.54M | case 3: tsize = 3; break; |
2185 | 258k | case 4: tsize = cu_type && s->pu_info[pu_pos].pu_type ? 3 : 4; break; |
2186 | 156k | case 5: |
2187 | 623k | case 6: tsize = 4; break; |
2188 | 8.42M | } |
2189 | 8.42M | ntiles = 1 << (log_size - tsize); |
2190 | | |
2191 | 18.4M | for (int ty = 0; ty < ntiles; ty++) |
2192 | 25.9M | for (int tx = 0; tx < ntiles; tx++) { |
2193 | 15.9M | int x = xpos + (tx << tsize); |
2194 | 15.9M | int y = ypos + (ty << tsize); |
2195 | 15.9M | int cu_pos = ((y & 63) >> 3) * 8 + ((x & 63) >> 3); |
2196 | | |
2197 | 15.9M | if (cu_type == CU_INTRA) |
2198 | 7.77M | deblock_set_strength(s, x, y, 1 << tsize, qp, 2); |
2199 | 8.17M | else if (cu_type != CU_SKIP && thread->coded_blk[cu_pos]) |
2200 | 3.75M | deblock_set_strength(s, x, y, 1 << tsize, qp, 1); |
2201 | 4.42M | else { |
2202 | 4.42M | deblock_set_strength(s, x, y, 1 << tsize, qp, 0); |
2203 | 4.42M | derive_deblock_strength(s, x, y, 1 << (tsize - 2)); |
2204 | 4.42M | } |
2205 | | |
2206 | 15.9M | deblock(s, frame, x, y, 1 << tsize, deblock_get_pos(s, x, y)); |
2207 | 15.9M | } |
2208 | 8.42M | } |
2209 | | |
2210 | | static int read_qp_offset(GetBitContext *gb, int qp_off_type) |
2211 | 1.01M | { |
2212 | 1.01M | int val; |
2213 | | |
2214 | 1.01M | switch (qp_off_type) { |
2215 | 548k | case 0: |
2216 | 548k | return 0; |
2217 | 353k | case 1: |
2218 | 353k | val = read_code012(gb); |
2219 | 353k | return val != 2 ? val : -1; |
2220 | 113k | default: |
2221 | 113k | if (!get_bits1(gb)) |
2222 | 70.5k | return 0; |
2223 | 43.2k | val = get_bits(gb, 2); |
2224 | 43.2k | if (!(val & 2)) |
2225 | 10.1k | return val + 1; |
2226 | 33.1k | else |
2227 | 33.1k | return -((val & 1) + 1); |
2228 | 1.01M | } |
2229 | 1.01M | } |
2230 | | |
/**
 * Compute the quantiser index used for VLC table selection.
 *
 * osvquant 0 leaves qp unchanged. osvquant 1 adds 5 while qp <= 25.
 * Any other osvquant adds 10 while qp <= 18 and 5 while qp <= 25.
 * Values of qp above 25 are always returned unchanged.
 */
static int calc_sel_qp(int osvquant, int qp)
{
    int boost;

    if (osvquant == 0 || qp > 25)
        boost = 0;
    else if (osvquant == 1 || qp > 18)
        boost = 5;
    else
        boost = 10;

    return qp + boost;
}
2245 | | |
2246 | | static int decode_slice(AVCodecContext *avctx, void *tdata, int cu_y, int threadnr) |
2247 | 139k | { |
2248 | 139k | RV60Context *s = avctx->priv_data; |
2249 | 139k | AVFrame * frame = tdata; |
2250 | 139k | ThreadContext thread; |
2251 | 139k | GetBitContext gb; |
2252 | 139k | int qp, sel_qp, ret; |
2253 | | |
2254 | 139k | thread.avg_data[0] = thread.avg_buffer; |
2255 | 139k | thread.avg_data[1] = thread.avg_buffer + 64*64; |
2256 | 139k | thread.avg_data[2] = thread.avg_buffer + 64*64 + 32*32; |
2257 | 139k | thread.avg_linesize[0] = 64; |
2258 | 139k | thread.avg_linesize[1] = 32; |
2259 | 139k | thread.avg_linesize[2] = 32; |
2260 | | |
2261 | 139k | if ((ret = init_get_bits8(&gb, s->slice[cu_y].data, s->slice[cu_y].data_size)) < 0) |
2262 | 0 | return ret; |
2263 | | |
2264 | 1.06M | for (int cu_x = 0; cu_x < s->cu_width; cu_x++) { |
2265 | 1.01M | if ((s->avctx->active_thread_type & FF_THREAD_SLICE) && cu_y) |
2266 | 0 | ff_thread_progress_await(&s->progress[cu_y - 1], cu_x + 2); |
2267 | | |
2268 | 1.01M | qp = s->qp + read_qp_offset(&gb, s->qp_off_type); |
2269 | 1.01M | if (qp < 0 || qp >= 64) { |
2270 | 731 | ret = AVERROR_INVALIDDATA; |
2271 | 731 | break; |
2272 | 731 | } |
2273 | 1.01M | sel_qp = calc_sel_qp(s->osvquant, qp); |
2274 | | |
2275 | 1.01M | memset(thread.coded_blk, 0, sizeof(thread.coded_blk)); |
2276 | 1.01M | thread.cu_split_pos = 0; |
2277 | | |
2278 | 1.01M | if ((ret = decode_cu_r(s, frame, &thread, &gb, cu_x << 6, cu_y << 6, 6, qp, sel_qp)) < 0) |
2279 | 90.5k | break; |
2280 | | |
2281 | 923k | if (s->deblock) { |
2282 | 699k | thread.cu_split_pos = 0; |
2283 | 699k | deblock_cu_r(s, frame, &thread, cu_x << 6, cu_y << 6, 6, qp); |
2284 | 699k | } |
2285 | | |
2286 | 923k | if (s->avctx->active_thread_type & FF_THREAD_SLICE) |
2287 | 0 | ff_thread_progress_report(&s->progress[cu_y], cu_x + 1); |
2288 | 923k | } |
2289 | | |
2290 | 139k | if (s->avctx->active_thread_type & FF_THREAD_SLICE) |
2291 | 0 | ff_thread_progress_report(&s->progress[cu_y], INT_MAX); |
2292 | | |
2293 | 139k | return ret; |
2294 | 139k | } |
2295 | | |
2296 | | static int rv60_decode_frame(AVCodecContext *avctx, AVFrame * frame, |
2297 | | int * got_frame, AVPacket * avpkt) |
2298 | 262k | { |
2299 | 262k | RV60Context *s = avctx->priv_data; |
2300 | 262k | GetBitContext gb; |
2301 | 262k | int ret, header_size, width, height, ofs; |
2302 | | |
2303 | 262k | if (avpkt->size == 0) { |
2304 | 9.68k | if (s->last_frame[NEXT_PIC]->data[0]) { |
2305 | 4.15k | av_frame_move_ref(frame, s->last_frame[NEXT_PIC]); |
2306 | 4.15k | *got_frame = 1; |
2307 | 4.15k | } |
2308 | 9.68k | return 0; |
2309 | 9.68k | } |
2310 | | |
2311 | 252k | if (avpkt->size < 9) |
2312 | 67.3k | return AVERROR_INVALIDDATA; |
2313 | | |
2314 | 184k | header_size = avpkt->data[0] * 8 + 9; |
2315 | 184k | if (avpkt->size < header_size) |
2316 | 9.73k | return AVERROR_INVALIDDATA; |
2317 | | |
2318 | 175k | if ((ret = init_get_bits8(&gb, avpkt->data + header_size, avpkt->size - header_size)) < 0) |
2319 | 0 | return ret; |
2320 | | |
2321 | 175k | if ((ret = read_frame_header(s, &gb, &width, &height)) < 0) |
2322 | 22.3k | return ret; |
2323 | | |
2324 | 152k | if (avctx->skip_frame >= AVDISCARD_NONREF && s->pict_type == AV_PICTURE_TYPE_B || |
2325 | 138k | avctx->skip_frame >= AVDISCARD_NONKEY && s->pict_type != AV_PICTURE_TYPE_I || |
2326 | 137k | avctx->skip_frame >= AVDISCARD_ALL) |
2327 | 27.3k | return avpkt->size; |
2328 | | |
2329 | 125k | if (s->pict_type != AV_PICTURE_TYPE_B) |
2330 | 119k | FFSWAP(AVFrame *, s->last_frame[NEXT_PIC], s->last_frame[LAST_PIC]); |
2331 | | |
2332 | 125k | if ((s->pict_type == AV_PICTURE_TYPE_P && !s->last_frame[LAST_PIC]->data[0]) || |
2333 | 113k | (s->pict_type == AV_PICTURE_TYPE_B && (!s->last_frame[LAST_PIC]->data[0] || !s->last_frame[NEXT_PIC]->data[0]))) { |
2334 | 13.2k | av_log(s->avctx, AV_LOG_ERROR, "missing reference frame\n"); |
2335 | 13.2k | return AVERROR_INVALIDDATA; |
2336 | 13.2k | } |
2337 | | |
2338 | 112k | s->last_frame[CUR_PIC]->pict_type = s->pict_type; |
2339 | 112k | if (s->pict_type == AV_PICTURE_TYPE_I) |
2340 | 97.4k | s->last_frame[CUR_PIC]->flags |= AV_FRAME_FLAG_KEY; |
2341 | | |
2342 | 112k | if ((ret = update_dimensions_clear_info(s, width, height)) < 0) |
2343 | 8.42k | return ret; |
2344 | | |
2345 | 103k | if (!s->last_frame[CUR_PIC]->data[0]) |
2346 | 102k | if ((ret = ff_get_buffer(avctx, s->last_frame[CUR_PIC], 0)) < 0) |
2347 | 68 | return ret; |
2348 | | |
2349 | 103k | if ((ret = read_slice_sizes(s, &gb)) < 0) |
2350 | 6.66k | return ret; |
2351 | | |
2352 | 97.1k | ofs = get_bits_count(&gb) / 8; |
2353 | | |
2354 | 238k | for (int i = 0; i < s->cu_height; i++) { |
2355 | 142k | if (ofs >= avpkt->size - header_size) |
2356 | 912 | return AVERROR_INVALIDDATA; |
2357 | 141k | s->slice[i].data = avpkt->data + header_size + ofs; |
2358 | 141k | s->slice[i].data_size = FFMIN(s->slice[i].size, avpkt->size - header_size - ofs); |
2359 | 141k | if (s->slice[i].size > INT32_MAX - ofs) |
2360 | 232 | return AVERROR_INVALIDDATA; |
2361 | 141k | ofs += s->slice[i].size; |
2362 | 141k | } |
2363 | | |
2364 | 96.0k | ret = progress_init(s, s->cu_height); |
2365 | 96.0k | if (ret < 0) |
2366 | 0 | return ret; |
2367 | | |
2368 | 96.0k | s->avctx->execute2(s->avctx, decode_slice, s->last_frame[CUR_PIC], NULL, s->cu_height); |
2369 | | |
2370 | 96.0k | ret = 0; |
2371 | 96.0k | if (s->pict_type == AV_PICTURE_TYPE_B) |
2372 | 4.37k | av_frame_move_ref(frame, s->last_frame[CUR_PIC]); |
2373 | 91.6k | else if (s->last_frame[LAST_PIC]->data[0]) |
2374 | 52.5k | ret = av_frame_ref(frame, s->last_frame[LAST_PIC]); |
2375 | 96.0k | if (ret < 0) |
2376 | 0 | return ret; |
2377 | | |
2378 | 96.0k | if (frame->data[0]) |
2379 | 56.9k | *got_frame = 1; |
2380 | | |
2381 | 96.0k | if (s->pict_type != AV_PICTURE_TYPE_B) { |
2382 | 91.6k | av_frame_unref(s->last_frame[NEXT_PIC]); |
2383 | 91.6k | FFSWAP(AVFrame *, s->last_frame[CUR_PIC], s->last_frame[NEXT_PIC]); |
2384 | 91.6k | } |
2385 | | |
2386 | 96.0k | if (s->pict_type != AV_PICTURE_TYPE_B) { |
2387 | 91.6k | s->ref_pts[0] = s->ref_pts[1]; |
2388 | 91.6k | s->ref_pts[1] = avpkt->pts; |
2389 | | |
2390 | 91.6k | s->ref_ts[0] = s->ref_ts[1]; |
2391 | 91.6k | s->ref_ts[1] = s->ts; |
2392 | | |
2393 | 91.6k | if (s->ref_pts[1] > s->ref_pts[0] && s->ref_ts[1] > s->ref_ts[0]) |
2394 | 4.11k | s->ts_scale = (s->ref_pts[1] - s->ref_pts[0]) / (s->ref_ts[1] - s->ref_ts[0]); |
2395 | 91.6k | } else { |
2396 | 4.37k | frame->pts = s->ref_pts[0] + (s->ts - s->ref_ts[0]) * s->ts_scale; |
2397 | 4.37k | } |
2398 | | |
2399 | 96.0k | return avpkt->size; |
2400 | 96.0k | } |
2401 | | |
2402 | | static av_cold void rv60_flush(AVCodecContext *avctx) |
2403 | 65.8k | { |
2404 | 65.8k | RV60Context *s = avctx->priv_data; |
2405 | | |
2406 | 263k | for (int i = 0; i < 3; i++) |
2407 | 197k | av_frame_unref(s->last_frame[i]); |
2408 | 65.8k | } |
2409 | | |
2410 | | static av_cold int rv60_decode_end(AVCodecContext * avctx) |
2411 | 5.59k | { |
2412 | 5.59k | RV60Context *s = avctx->priv_data; |
2413 | | |
2414 | 22.3k | for (int i = 0; i < 3; i++) |
2415 | 16.7k | av_frame_free(&s->last_frame[i]); |
2416 | | |
2417 | 5.59k | av_freep(&s->slice); |
2418 | 5.59k | av_freep(&s->pu_info); |
2419 | 5.59k | av_freep(&s->blk_info); |
2420 | 5.59k | av_freep(&s->top_str); |
2421 | 5.59k | av_freep(&s->left_str); |
2422 | | |
2423 | 29.3k | for (int i = 0; i < s->nb_progress; i++) |
2424 | 23.7k | ff_thread_progress_destroy(&s->progress[i]); |
2425 | 5.59k | av_freep(&s->progress); |
2426 | | |
2427 | 5.59k | return 0; |
2428 | 5.59k | } |
2429 | | |
2430 | | const FFCodec ff_rv60_decoder = { |
2431 | | .p.name = "rv60", |
2432 | | CODEC_LONG_NAME("RealVideo 6.0"), |
2433 | | .p.type = AVMEDIA_TYPE_VIDEO, |
2434 | | .p.id = AV_CODEC_ID_RV60, |
2435 | | .priv_data_size = sizeof(RV60Context), |
2436 | | .init = rv60_decode_init, |
2437 | | .close = rv60_decode_end, |
2438 | | FF_CODEC_DECODE_CB(rv60_decode_frame), |
2439 | | .flush = rv60_flush, |
2440 | | .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_DELAY | AV_CODEC_CAP_SLICE_THREADS, |
2441 | | .caps_internal = FF_CODEC_CAP_INIT_CLEANUP, |
2442 | | }; |