Coverage Report

Created: 2025-12-31 07:57

next uncovered line (L), next uncovered region (R), next uncovered branch (B)
/src/ffmpeg/libavcodec/motion_est.c
Line
Count
Source
1
/*
2
 * Motion estimation
3
 * Copyright (c) 2000,2001 Fabrice Bellard
4
 * Copyright (c) 2002-2004 Michael Niedermayer
5
 *
6
 * new motion estimation (X1/EPZS) by Michael Niedermayer <michaelni@gmx.at>
7
 *
8
 * This file is part of FFmpeg.
9
 *
10
 * FFmpeg is free software; you can redistribute it and/or
11
 * modify it under the terms of the GNU Lesser General Public
12
 * License as published by the Free Software Foundation; either
13
 * version 2.1 of the License, or (at your option) any later version.
14
 *
15
 * FFmpeg is distributed in the hope that it will be useful,
16
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
17
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
18
 * Lesser General Public License for more details.
19
 *
20
 * You should have received a copy of the GNU Lesser General Public
21
 * License along with FFmpeg; if not, write to the Free Software
22
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
23
 */
24
25
/**
26
 * @file
27
 * Motion estimation.
28
 */
29
30
#include <stdlib.h>
31
#include <stdio.h>
32
#include <limits.h>
33
34
#include "avcodec.h"
35
#include "h263.h"
36
#include "mathops.h"
37
#include "motion_est.h"
38
#include "mpegutils.h"
39
#include "mpegvideoenc.h"
40
41
2.49M
#define P_LEFT P[1]
42
1.27M
#define P_TOP P[2]
43
1.49M
#define P_TOPRIGHT P[3]
44
436k
#define P_MEDIAN P[4]
45
0
#define P_MV1 P[9]
46
47
19.6M
#define ME_MAP_SHIFT 3
48
18.7M
#define ME_MAP_MV_BITS 11
49
50
static int sad_hpel_motion_search(MPVEncContext *const s,
51
                                  int *mx_ptr, int *my_ptr, int dmin,
52
                                  int src_index, int ref_index,
53
                                  int size, int h);
54
55
static inline unsigned update_map_generation(MotionEstContext *c)
56
923k
{
57
923k
    c->map_generation+= 1<<(ME_MAP_MV_BITS*2);
58
923k
    if(c->map_generation==0){
59
306
        c->map_generation= 1<<(ME_MAP_MV_BITS*2);
60
306
        memset(c->map, 0, sizeof(uint32_t)*ME_MAP_SIZE);
61
306
    }
62
923k
    return c->map_generation;
63
923k
}
64
65
/* shape adaptive search stuff */
66
typedef struct Minima{
67
    int height;
68
    int x, y;
69
    int checked;
70
}Minima;
71
72
0
static int minima_cmp(const void *a, const void *b){
73
0
    const Minima *da = (const Minima *) a;
74
0
    const Minima *db = (const Minima *) b;
75
76
0
    return da->height - db->height;
77
0
}
78
79
3.64M
#define FLAG_QPEL   1 //must be 1
80
541k
#define FLAG_CHROMA 2
81
541k
#define FLAG_DIRECT 4
82
83
static inline void init_ref(MotionEstContext *c, uint8_t *const src[3],
84
                            uint8_t *const ref[3], uint8_t *const ref2[3],
85
                            int x, int y, int ref_index)
86
381k
{
87
381k
    const int offset[3]= {
88
381k
          y*c->  stride + x,
89
381k
        ((y*c->uvstride + x)>>1),
90
381k
        ((y*c->uvstride + x)>>1),
91
381k
    };
92
381k
    int i;
93
1.52M
    for(i=0; i<3; i++){
94
1.14M
        c->src[0][i]= src[i] ? src[i] + offset[i] : NULL;
95
1.14M
        c->ref[0][i]= ref[i] ? ref[i] + offset[i] : NULL;
96
1.14M
    }
97
381k
    if(ref_index){
98
0
        for(i=0; i<3; i++){
99
0
            c->ref[ref_index][i]= ref2[i] ? ref2[i] + offset[i] : NULL;
100
0
        }
101
0
    }
102
381k
}
103
104
41.3k
static int get_flags(MotionEstContext *c, int direct, int chroma){
105
41.3k
    return   ((c->avctx->flags&AV_CODEC_FLAG_QPEL) ? FLAG_QPEL : 0)
106
41.3k
           + (direct ? FLAG_DIRECT : 0)
107
41.3k
           + (chroma ? FLAG_CHROMA : 0);
108
41.3k
}
109
110
static av_always_inline int cmp_direct_inline(MPVEncContext *const s, const int x, const int y, const int subx, const int suby,
111
                      const int size, const int h, int ref_index, int src_index,
112
0
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func, int qpel){
113
0
    MotionEstContext *const c = &s->me;
114
0
    const int stride= c->stride;
115
0
    const int hx = subx + x * (1 << (1 + qpel));
116
0
    const int hy = suby + y * (1 << (1 + qpel));
117
0
    const uint8_t * const * const ref = c->ref[ref_index];
118
0
    const uint8_t * const * const src = c->src[src_index];
119
0
    int d;
120
    //FIXME check chroma 4mv, (no crashes ...)
121
0
    av_assert2(x >= c->xmin && hx <= c->xmax<<(qpel+1) && y >= c->ymin && hy <= c->ymax<<(qpel+1));
122
0
    if (x >= c->xmin && hx <= c->xmax << (qpel + 1) &&
123
0
        y >= c->ymin && hy <= c->ymax << (qpel + 1)) {
124
0
        const int time_pp = s->c.pp_time;
125
0
        const int time_pb = s->c.pb_time;
126
0
        const int mask    = 2 * qpel + 1;
127
0
        if (s->c.mv_type == MV_TYPE_8X8) {
128
0
            for(int i = 0; i < 4; ++i) {
129
0
                int fx  = c->direct_basis_mv[i][0] + hx;
130
0
                int fy  = c->direct_basis_mv[i][1] + hy;
131
0
                int bx  = hx ? fx - c->co_located_mv[i][0] : c->co_located_mv[i][0] * (time_pb - time_pp)/time_pp + ((i &1)<<(qpel+4));
132
0
                int by  = hy ? fy - c->co_located_mv[i][1] : c->co_located_mv[i][1] * (time_pb - time_pp)/time_pp + ((i>>1)<<(qpel+4));
133
0
                int fxy = (fx & mask) + ((fy & mask) << (qpel + 1));
134
0
                int bxy = (bx & mask) + ((by & mask) << (qpel + 1));
135
136
0
                uint8_t *dst = c->temp + 8 * (i & 1) + 8 * stride * (i >> 1);
137
0
                if (qpel) {
138
0
                    c->qpel_put[1][fxy](dst, ref[0] + (fx >> 2) + (fy >> 2) * stride, stride);
139
0
                    c->qpel_avg[1][bxy](dst, ref[8] + (bx >> 2) + (by >> 2) * stride, stride);
140
0
                } else {
141
0
                    c->hpel_put[1][fxy](dst, ref[0] + (fx >> 1) + (fy >> 1) * stride, stride, 8);
142
0
                    c->hpel_avg[1][bxy](dst, ref[8] + (bx >> 1) + (by >> 1) * stride, stride, 8);
143
0
                }
144
0
            }
145
0
        } else {
146
0
            int fx  = c->direct_basis_mv[0][0] + hx;
147
0
            int fy  = c->direct_basis_mv[0][1] + hy;
148
0
            int bx  = hx ? fx - c->co_located_mv[0][0] : (c->co_located_mv[0][0] * (time_pb - time_pp)/time_pp);
149
0
            int by  = hy ? fy - c->co_located_mv[0][1] : (c->co_located_mv[0][1] * (time_pb - time_pp)/time_pp);
150
0
            int fxy = (fx & mask) + ((fy & mask) << (qpel + 1));
151
0
            int bxy = (bx & mask) + ((by & mask) << (qpel + 1));
152
153
0
            if (qpel) {
154
0
                c->qpel_put[1][fxy](c->temp               , ref[0] + (fx>>2) + (fy>>2)*stride               , stride);
155
0
                c->qpel_put[1][fxy](c->temp + 8           , ref[0] + (fx>>2) + (fy>>2)*stride + 8           , stride);
156
0
                c->qpel_put[1][fxy](c->temp     + 8*stride, ref[0] + (fx>>2) + (fy>>2)*stride     + 8*stride, stride);
157
0
                c->qpel_put[1][fxy](c->temp + 8 + 8*stride, ref[0] + (fx>>2) + (fy>>2)*stride + 8 + 8*stride, stride);
158
0
                c->qpel_avg[1][bxy](c->temp               , ref[8] + (bx>>2) + (by>>2)*stride               , stride);
159
0
                c->qpel_avg[1][bxy](c->temp + 8           , ref[8] + (bx>>2) + (by>>2)*stride + 8           , stride);
160
0
                c->qpel_avg[1][bxy](c->temp     + 8*stride, ref[8] + (bx>>2) + (by>>2)*stride     + 8*stride, stride);
161
0
                c->qpel_avg[1][bxy](c->temp + 8 + 8*stride, ref[8] + (bx>>2) + (by>>2)*stride + 8 + 8*stride, stride);
162
0
            } else {
163
0
                av_assert2((fx >> 1) + 16 * s->c.mb_x >= -16);
164
0
                av_assert2((fy >> 1) + 16 * s->c.mb_y >= -16);
165
0
                av_assert2((fx >> 1) + 16 * s->c.mb_x <= s->c.width);
166
0
                av_assert2((fy >> 1) + 16 * s->c.mb_y <= s->c.height);
167
0
                av_assert2((bx >> 1) + 16 * s->c.mb_x >= -16);
168
0
                av_assert2((by >> 1) + 16 * s->c.mb_y >= -16);
169
0
                av_assert2((bx >> 1) + 16 * s->c.mb_x <= s->c.width);
170
0
                av_assert2((by >> 1) + 16 * s->c.mb_y <= s->c.height);
171
172
0
                c->hpel_put[0][fxy](c->temp, ref[0] + (fx >> 1) + (fy >> 1) * stride, stride, 16);
173
0
                c->hpel_avg[0][bxy](c->temp, ref[8] + (bx >> 1) + (by >> 1) * stride, stride, 16);
174
0
            }
175
0
        }
176
0
        d = cmp_func(s, c->temp, src[0], stride, 16);
177
0
    } else
178
0
        d = 256 * 256 * 256 * 32;
179
0
    return d;
180
0
}
181
182
static av_always_inline int cmp_inline(MPVEncContext *const s, const int x, const int y, const int subx, const int suby,
183
                      const int size, const int h, int ref_index, int src_index,
184
13.6M
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func, int qpel, int chroma){
185
13.6M
    MotionEstContext *const c = &s->me;
186
13.6M
    const int stride= c->stride;
187
13.6M
    const int uvstride= c->uvstride;
188
13.6M
    const int dxy= subx + (suby<<(1+qpel)); //FIXME log2_subpel?
189
13.6M
    const int hx= subx + x*(1<<(1+qpel));
190
13.6M
    const int hy= suby + y*(1<<(1+qpel));
191
13.6M
    const uint8_t * const * const ref = c->ref[ref_index];
192
13.6M
    const uint8_t * const * const src = c->src[src_index];
193
13.6M
    int d;
194
    //FIXME check chroma 4mv, (no crashes ...)
195
13.6M
    int uvdxy;              /* no, it might not be used uninitialized */
196
13.6M
    if (dxy) {
197
139k
        if (qpel) {
198
0
            if (h << size == 16) {
199
0
                c->qpel_put[size][dxy](c->temp,  ref[0] + x + y * stride, stride); //FIXME prototype (add h)
200
0
            } else if (size == 0 && h == 8) {
201
0
                c->qpel_put[1][dxy](c->temp    , ref[0] + x + y * stride    , stride);
202
0
                c->qpel_put[1][dxy](c->temp + 8, ref[0] + x + y * stride + 8, stride);
203
0
            } else
204
0
                av_assert2(0);
205
0
            if (chroma) {
206
0
                int cx = hx / 2;
207
0
                int cy = hy / 2;
208
0
                cx = (cx >> 1) | (cx & 1);
209
0
                cy = (cy >> 1) | (cy & 1);
210
0
                uvdxy = (cx & 1) + 2 * (cy & 1);
211
                // FIXME x/y wrong, but MPEG-4 qpel is sick anyway, we should drop as much of it as possible in favor for H.264
212
0
            }
213
139k
        } else {
214
139k
            c->hpel_put[size][dxy](c->temp, ref[0] + x + y * stride, stride, h);
215
139k
            if (chroma)
216
0
                uvdxy = dxy | (x & 1) | (2 * (y & 1));
217
139k
        }
218
139k
        d = cmp_func(s, c->temp, src[0], stride, h);
219
13.5M
    } else {
220
13.5M
        d = cmp_func(s, src[0], ref[0] + x + y * stride, stride, h);
221
13.5M
        if (chroma)
222
0
            uvdxy = (x & 1) + 2 * (y & 1);
223
13.5M
    }
224
13.6M
    if (chroma) {
225
0
        uint8_t *const uvtemp = c->temp + 16 * stride;
226
0
        c->hpel_put[size + 1][uvdxy](uvtemp    , ref[1] + (x >> 1) + (y >> 1) * uvstride, uvstride, h >> 1);
227
0
        c->hpel_put[size + 1][uvdxy](uvtemp + 8, ref[2] + (x >> 1) + (y >> 1) * uvstride, uvstride, h >> 1);
228
0
        d += chroma_cmp_func(s, uvtemp    , src[1], uvstride, h >> 1);
229
0
        d += chroma_cmp_func(s, uvtemp + 8, src[2], uvstride, h >> 1);
230
0
    }
231
13.6M
    return d;
232
13.6M
}
233
234
static int cmp_simple(MPVEncContext *const s, const int x, const int y,
235
                      int ref_index, int src_index,
236
13.1M
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func){
237
13.1M
    return cmp_inline(s,x,y,0,0,0,16,ref_index,src_index, cmp_func, chroma_cmp_func, 0, 0);
238
13.1M
}
239
240
static int cmp_fpel_internal(MPVEncContext *const s, const int x, const int y,
241
                      const int size, const int h, int ref_index, int src_index,
242
0
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func, const int flags){
243
0
    if(flags&FLAG_DIRECT){
244
0
        return cmp_direct_inline(s,x,y,0,0,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, flags&FLAG_QPEL);
245
0
    }else{
246
0
        return cmp_inline(s,x,y,0,0,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, 0, flags&FLAG_CHROMA);
247
0
    }
248
0
}
249
250
static int cmp_internal(MPVEncContext *const s, const int x, const int y, const int subx, const int suby,
251
                      const int size, const int h, int ref_index, int src_index,
252
541k
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func, const int flags){
253
541k
    if(flags&FLAG_DIRECT){
254
0
        return cmp_direct_inline(s,x,y,subx,suby,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, flags&FLAG_QPEL);
255
541k
    }else{
256
541k
        return cmp_inline(s,x,y,subx,suby,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, flags&FLAG_QPEL, flags&FLAG_CHROMA);
257
541k
    }
258
541k
}
259
260
/** @brief compares a block (either a full macroblock or a partition thereof)
261
    against a proposed motion-compensated prediction of that block
262
 */
263
static av_always_inline int cmp(MPVEncContext *const s, const int x, const int y, const int subx, const int suby,
264
                      const int size, const int h, int ref_index, int src_index,
265
13.6M
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func, const int flags){
266
13.6M
    if(av_builtin_constant_p(flags) && av_builtin_constant_p(h) && av_builtin_constant_p(size)
267
13.1M
       && av_builtin_constant_p(subx) && av_builtin_constant_p(suby)
268
13.1M
       && flags==0 && h==16 && size==0 && subx==0 && suby==0){
269
13.1M
        return cmp_simple(s,x,y,ref_index,src_index, cmp_func, chroma_cmp_func);
270
13.1M
    }else if(av_builtin_constant_p(subx) && av_builtin_constant_p(suby)
271
0
       && subx==0 && suby==0){
272
0
        return cmp_fpel_internal(s,x,y,size,h,ref_index,src_index, cmp_func, chroma_cmp_func,flags);
273
541k
    }else{
274
541k
        return cmp_internal(s,x,y,subx,suby,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, flags);
275
541k
    }
276
13.6M
}
277
278
static int cmp_hpel(MPVEncContext *const s, const int x, const int y, const int subx, const int suby,
279
                      const int size, const int h, int ref_index, int src_index,
280
0
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func, const int flags){
281
0
    if(flags&FLAG_DIRECT){
282
0
        return cmp_direct_inline(s,x,y,subx,suby,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, 0);
283
0
    }else{
284
0
        return cmp_inline(s,x,y,subx,suby,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, 0, flags&FLAG_CHROMA);
285
0
    }
286
0
}
287
288
static int cmp_qpel(MPVEncContext *const s, const int x, const int y, const int subx, const int suby,
289
                      const int size, const int h, int ref_index, int src_index,
290
0
                      me_cmp_func cmp_func, me_cmp_func chroma_cmp_func, const int flags){
291
0
    if(flags&FLAG_DIRECT){
292
0
        return cmp_direct_inline(s,x,y,subx,suby,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, 1);
293
0
    }else{
294
0
        return cmp_inline(s,x,y,subx,suby,size,h,ref_index,src_index, cmp_func, chroma_cmp_func, 1, flags&FLAG_CHROMA);
295
0
    }
296
0
}
297
298
#include "motion_est_template.c"
299
300
static int zero_cmp(MPVEncContext *const s, const uint8_t *a, const uint8_t *b,
301
                    ptrdiff_t stride, int h)
302
0
{
303
0
    return 0;
304
0
}
305
306
0
static void zero_hpel(uint8_t *a, const uint8_t *b, ptrdiff_t stride, int h){
307
0
}
308
309
av_cold int ff_me_init(MotionEstContext *c, AVCodecContext *avctx,
310
                       const MECmpContext *mecc, int mpvenc)
311
13.7k
{
312
13.7k
    int cache_size = FFMIN(ME_MAP_SIZE>>ME_MAP_SHIFT, 1<<ME_MAP_SHIFT);
313
13.7k
    int dia_size   = FFMAX(FFABS(avctx->dia_size) & 255, FFABS(avctx->pre_dia_size) & 255);
314
13.7k
    int ret;
315
316
13.7k
    if (FFMIN(avctx->dia_size, avctx->pre_dia_size) < -FFMIN(ME_MAP_SIZE, MAX_SAB_SIZE)) {
317
0
        av_log(avctx, AV_LOG_ERROR, "ME_MAP size is too small for SAB diamond\n");
318
0
        return AVERROR(EINVAL);
319
0
    }
320
321
13.7k
    c->avctx = avctx;
322
323
13.7k
    if (avctx->codec_id == AV_CODEC_ID_H261)
324
472
        avctx->me_sub_cmp = avctx->me_cmp;
325
326
13.7k
    if (cache_size < 2 * dia_size)
327
0
        av_log(avctx, AV_LOG_INFO, "ME_MAP size may be a little small for the selected diamond size\n");
328
329
13.7k
    ret  = ff_set_cmp(mecc, c->me_pre_cmp, avctx->me_pre_cmp, mpvenc);
330
13.7k
    ret |= ff_set_cmp(mecc, c->me_cmp,     avctx->me_cmp,     mpvenc);
331
13.7k
    ret |= ff_set_cmp(mecc, c->me_sub_cmp, avctx->me_sub_cmp, mpvenc);
332
13.7k
    ret |= ff_set_cmp(mecc, c->mb_cmp,     avctx->mb_cmp,     mpvenc);
333
13.7k
    if (ret < 0)
334
0
        return ret;
335
336
13.7k
    c->sse = mecc->sse[0];
337
13.7k
    memcpy(c->pix_abs, mecc->pix_abs, sizeof(c->pix_abs));
338
339
13.7k
    c->flags     = get_flags(c, 0, avctx->me_cmp     & FF_CMP_CHROMA);
340
13.7k
    c->sub_flags = get_flags(c, 0, avctx->me_sub_cmp & FF_CMP_CHROMA);
341
13.7k
    c->mb_flags  = get_flags(c, 0, avctx->mb_cmp     & FF_CMP_CHROMA);
342
343
13.7k
    if (avctx->codec_id == AV_CODEC_ID_H261) {
344
472
        c->sub_motion_search = no_sub_motion_search;
345
13.3k
    } else if (avctx->flags & AV_CODEC_FLAG_QPEL) {
346
0
        c->sub_motion_search= qpel_motion_search;
347
13.3k
    }else{
348
13.3k
        if(c->avctx->me_sub_cmp&FF_CMP_CHROMA)
349
0
            c->sub_motion_search= hpel_motion_search;
350
13.3k
        else if(   c->avctx->me_sub_cmp == FF_CMP_SAD
351
13.3k
                && c->avctx->    me_cmp == FF_CMP_SAD
352
13.3k
                && c->avctx->    mb_cmp == FF_CMP_SAD)
353
13.3k
            c->sub_motion_search= sad_hpel_motion_search; // 2050 vs. 2450 cycles
354
0
        else
355
0
            c->sub_motion_search= hpel_motion_search;
356
13.3k
    }
357
358
    /* 8x8 fullpel search would need a 4x4 chroma compare, which we do
359
     * not have yet, and even if we had, the motion estimation code
360
     * does not expect it. */
361
13.7k
    if (avctx->codec_id != AV_CODEC_ID_SNOW) {
362
9.72k
        if ((avctx->me_cmp & FF_CMP_CHROMA) /* && !c->me_cmp[2] */)
363
0
            c->me_cmp[2] = zero_cmp;
364
9.72k
        if ((avctx->me_sub_cmp & FF_CMP_CHROMA) && !c->me_sub_cmp[2])
365
0
            c->me_sub_cmp[2] = zero_cmp;
366
9.72k
    }
367
368
13.7k
    return 0;
369
13.7k
}
370
371
void ff_me_init_pic(MPVEncContext *const s)
372
101k
{
373
101k
    MotionEstContext *const c = &s->me;
374
375
/*FIXME s->c.no_rounding b_type*/
376
101k
    if (c->avctx->flags & AV_CODEC_FLAG_QPEL) {
377
0
        c->qpel_avg = s->c.qdsp.avg_qpel_pixels_tab;
378
0
        if (s->c.no_rounding)
379
0
            c->qpel_put = s->c.qdsp.put_no_rnd_qpel_pixels_tab;
380
0
        else
381
0
            c->qpel_put = s->c.qdsp.put_qpel_pixels_tab;
382
0
    }
383
101k
    c->hpel_avg = s->c.hdsp.avg_pixels_tab;
384
101k
    if (s->c.no_rounding)
385
1.49k
        c->hpel_put = s->c.hdsp.put_no_rnd_pixels_tab;
386
99.8k
    else
387
99.8k
        c->hpel_put = s->c.hdsp.put_pixels_tab;
388
389
101k
    if (s->c.linesize) {
390
101k
        c->stride   = s->c.linesize;
391
101k
        c->uvstride = s->c.uvlinesize;
392
101k
    }else{
393
0
        c->stride   = 16*s->c.mb_width + 32;
394
0
        c->uvstride =  8*s->c.mb_width + 16;
395
0
    }
396
101k
    if (s->c.codec_id != AV_CODEC_ID_SNOW) {
397
101k
        c->hpel_put[2][0]= c->hpel_put[2][1]=
398
101k
        c->hpel_put[2][2]= c->hpel_put[2][3]= zero_hpel;
399
101k
    }
400
    /* Reset the average MB variance and scene change stats */
401
101k
    c->scene_change_score = 0;
402
101k
    c->mb_var_sum_temp    =
403
101k
    c->mc_mb_var_sum_temp = 0;
404
101k
}
405
406
2.34M
#define CHECK_SAD_HALF_MV(suffix, x, y) \
407
2.34M
{\
408
2.34M
    d  = c->pix_abs[size][(x ? 1 : 0) + (y ? 2 : 0)](NULL, pix, ptr + ((x) >> 1), stride, h); \
409
2.34M
    d += (mv_penalty[pen_x + x] + mv_penalty[pen_y + y])*penalty_factor;\
410
2.34M
    COPY3_IF_LT(dminh, d, dx, x, dy, y)\
411
2.34M
}
412
413
static int sad_hpel_motion_search(MPVEncContext *const s,
414
                                  int *mx_ptr, int *my_ptr, int dmin,
415
                                  int src_index, int ref_index,
416
                                  int size, int h)
417
923k
{
418
923k
    MotionEstContext *const c = &s->me;
419
923k
    const int penalty_factor= c->sub_penalty_factor;
420
923k
    int mx, my, dminh;
421
923k
    const uint8_t *pix, *ptr;
422
923k
    int stride= c->stride;
423
923k
    LOAD_COMMON
424
425
923k
    av_assert2(c->sub_flags == 0);
426
427
923k
    if(c->skip){
428
49.0k
        *mx_ptr = 0;
429
49.0k
        *my_ptr = 0;
430
49.0k
        return dmin;
431
49.0k
    }
432
433
873k
    pix = c->src[src_index][0];
434
435
873k
    mx = *mx_ptr;
436
873k
    my = *my_ptr;
437
873k
    ptr = c->ref[ref_index][0] + (my * stride) + mx;
438
439
873k
    dminh = dmin;
440
441
873k
    if (mx > xmin && mx < xmax &&
442
730k
        my > ymin && my < ymax) {
443
586k
        int dx=0, dy=0;
444
586k
        int d, pen_x, pen_y;
445
586k
        const int index= my*(1<<ME_MAP_SHIFT) + mx;
446
586k
        const int t= score_map[(index-(1<<ME_MAP_SHIFT))&(ME_MAP_SIZE-1)];
447
586k
        const int l= score_map[(index- 1               )&(ME_MAP_SIZE-1)];
448
586k
        const int r= score_map[(index+ 1               )&(ME_MAP_SIZE-1)];
449
586k
        const int b= score_map[(index+(1<<ME_MAP_SHIFT))&(ME_MAP_SIZE-1)];
450
586k
        mx += mx;
451
586k
        my += my;
452
453
454
586k
        pen_x= pred_x + mx;
455
586k
        pen_y= pred_y + my;
456
457
586k
        ptr-= stride;
458
586k
        if(t<=b){
459
301k
            CHECK_SAD_HALF_MV(y2 , 0, -1)
460
301k
            if(l<=r){
461
182k
                CHECK_SAD_HALF_MV(xy2, -1, -1)
462
182k
                if(t+r<=b+l){
463
129k
                    CHECK_SAD_HALF_MV(xy2, +1, -1)
464
129k
                    ptr+= stride;
465
129k
                }else{
466
53.4k
                    ptr+= stride;
467
53.4k
                    CHECK_SAD_HALF_MV(xy2, -1, +1)
468
53.4k
                }
469
182k
                CHECK_SAD_HALF_MV(x2 , -1,  0)
470
182k
            }else{
471
118k
                CHECK_SAD_HALF_MV(xy2, +1, -1)
472
118k
                if(t+l<=b+r){
473
75.8k
                    CHECK_SAD_HALF_MV(xy2, -1, -1)
474
75.8k
                    ptr+= stride;
475
75.8k
                }else{
476
42.5k
                    ptr+= stride;
477
42.5k
                    CHECK_SAD_HALF_MV(xy2, +1, +1)
478
42.5k
                }
479
118k
                CHECK_SAD_HALF_MV(x2 , +1,  0)
480
118k
            }
481
301k
        }else{
482
285k
            if(l<=r){
483
146k
                if(t+l<=b+r){
484
44.0k
                    CHECK_SAD_HALF_MV(xy2, -1, -1)
485
44.0k
                    ptr+= stride;
486
102k
                }else{
487
102k
                    ptr+= stride;
488
102k
                    CHECK_SAD_HALF_MV(xy2, +1, +1)
489
102k
                }
490
146k
                CHECK_SAD_HALF_MV(x2 , -1,  0)
491
146k
                CHECK_SAD_HALF_MV(xy2, -1, +1)
492
146k
            }else{
493
139k
                if(t+r<=b+l){
494
50.3k
                    CHECK_SAD_HALF_MV(xy2, +1, -1)
495
50.3k
                    ptr+= stride;
496
89.0k
                }else{
497
89.0k
                    ptr+= stride;
498
89.0k
                    CHECK_SAD_HALF_MV(xy2, -1, +1)
499
89.0k
                }
500
139k
                CHECK_SAD_HALF_MV(x2 , +1,  0)
501
139k
                CHECK_SAD_HALF_MV(xy2, +1, +1)
502
139k
            }
503
285k
            CHECK_SAD_HALF_MV(y2 ,  0, +1)
504
285k
        }
505
586k
        mx+=dx;
506
586k
        my+=dy;
507
508
586k
    }else{
509
287k
        mx += mx;
510
287k
        my += my;
511
287k
    }
512
513
873k
    *mx_ptr = mx;
514
873k
    *my_ptr = my;
515
873k
    return dminh;
516
923k
}
517
518
static inline void set_p_mv_tables(MPVEncContext *const s, int mx, int my, int mv4)
519
381k
{
520
381k
    const int xy = s->c.mb_x + s->c.mb_y * s->c.mb_stride;
521
522
381k
    s->p_mv_table[xy][0] = mx;
523
381k
    s->p_mv_table[xy][1] = my;
524
525
    /* has already been set to the 4 MV if 4MV is done */
526
381k
    if(mv4){
527
381k
        int mot_xy = s->c.block_index[0];
528
529
381k
        s->c.cur_pic.motion_val[0][mot_xy    ][0] = mx;
530
381k
        s->c.cur_pic.motion_val[0][mot_xy    ][1] = my;
531
381k
        s->c.cur_pic.motion_val[0][mot_xy + 1][0] = mx;
532
381k
        s->c.cur_pic.motion_val[0][mot_xy + 1][1] = my;
533
534
381k
        mot_xy += s->c.b8_stride;
535
381k
        s->c.cur_pic.motion_val[0][mot_xy    ][0] = mx;
536
381k
        s->c.cur_pic.motion_val[0][mot_xy    ][1] = my;
537
381k
        s->c.cur_pic.motion_val[0][mot_xy + 1][0] = mx;
538
381k
        s->c.cur_pic.motion_val[0][mot_xy + 1][1] = my;
539
381k
    }
540
381k
}
541
542
/**
543
 * get fullpel ME search limits.
544
 */
545
static inline void get_limits(MPVEncContext *const s, int x, int y, int bframe)
546
381k
{
547
381k
    MotionEstContext *const c = &s->me;
548
381k
    int range= c->avctx->me_range >> (1 + !!(c->flags&FLAG_QPEL));
549
381k
    int max_range = MAX_MV >> (1 + !!(c->flags&FLAG_QPEL));
550
/*
551
    if(c->avctx->me_range) c->range= c->avctx->me_range >> 1;
552
    else                   c->range= 16;
553
*/
554
381k
    if (c->unrestricted_mv) {
555
0
        c->xmin = - x - 16;
556
0
        c->ymin = - y - 16;
557
0
        c->xmax = - x + s->c.width;
558
0
        c->ymax = - y + s->c.height;
559
381k
    } else if (!(av_builtin_constant_p(bframe) && bframe) && s->c.out_format == FMT_H261){
560
        // Search range of H.261 is different from other codec standards
561
0
        c->xmin = (x > 15) ? - 15 : 0;
562
0
        c->ymin = (y > 15) ? - 15 : 0;
563
0
        c->xmax = (x < s->c.mb_width * 16 - 16) ? 15 : 0;
564
0
        c->ymax = (y < s->c.mb_height * 16 - 16) ? 15 : 0;
565
381k
    } else {
566
381k
        c->xmin = - x;
567
381k
        c->ymin = - y;
568
381k
        c->xmax = - x + s->c.mb_width *16 - 16;
569
381k
        c->ymax = - y + s->c.mb_height*16 - 16;
570
381k
    }
571
381k
    if(!range || range > max_range)
572
381k
        range = max_range;
573
381k
    if(range){
574
381k
        c->xmin = FFMAX(c->xmin,-range);
575
381k
        c->xmax = FFMIN(c->xmax, range);
576
381k
        c->ymin = FFMAX(c->ymin,-range);
577
381k
        c->ymax = FFMIN(c->ymax, range);
578
381k
    }
579
381k
}
580
581
0
static inline void init_mv4_ref(MotionEstContext *c){
582
0
    const int stride= c->stride;
583
584
0
    c->ref[1][0] = c->ref[0][0] + 8;
585
0
    c->ref[2][0] = c->ref[0][0] + 8*stride;
586
0
    c->ref[3][0] = c->ref[2][0] + 8;
587
0
    c->src[1][0] = c->src[0][0] + 8;
588
0
    c->src[2][0] = c->src[0][0] + 8*stride;
589
0
    c->src[3][0] = c->src[2][0] + 8;
590
0
}
591
592
static inline int h263_mv4_search(MPVEncContext *const s, int mx, int my, int shift)
593
0
{
594
0
    MotionEstContext *const c = &s->me;
595
0
    const int size= 1;
596
0
    const int h=8;
597
0
    int block;
598
0
    int P[10][2];
599
0
    int dmin_sum=0, mx4_sum=0, my4_sum=0, i;
600
0
    int same=1;
601
0
    const int stride= c->stride;
602
0
    const uint8_t *mv_penalty = c->current_mv_penalty;
603
0
    int safety_clipping = c->unrestricted_mv && (s->c.width&15) && (s->c.height&15);
604
605
0
    init_mv4_ref(c);
606
607
0
    for(block=0; block<4; block++){
608
0
        int mx4, my4;
609
0
        int pred_x4, pred_y4;
610
0
        int dmin4;
611
0
        static const int off[4]= {2, 1, 1, -1};
612
0
        const int mot_stride = s->c.b8_stride;
613
0
        const int mot_xy = s->c.block_index[block];
614
615
0
        if(safety_clipping){
616
0
            c->xmax = - 16*s->c.mb_x + s->c.width  - 8*(block &1);
617
0
            c->ymax = - 16*s->c.mb_y + s->c.height - 8*(block>>1);
618
0
        }
619
620
0
        P_LEFT[0] = s->c.cur_pic.motion_val[0][mot_xy - 1][0];
621
0
        P_LEFT[1] = s->c.cur_pic.motion_val[0][mot_xy - 1][1];
622
623
0
        if (P_LEFT[0] > c->xmax * (1 << shift)) P_LEFT[0] = c->xmax * (1 << shift);
624
625
        /* special case for first line */
626
0
        if (s->c.first_slice_line && block < 2) {
627
0
            c->pred_x= pred_x4= P_LEFT[0];
628
0
            c->pred_y= pred_y4= P_LEFT[1];
629
0
        } else {
630
0
            P_TOP[0]      = s->c.cur_pic.motion_val[0][mot_xy - mot_stride             ][0];
631
0
            P_TOP[1]      = s->c.cur_pic.motion_val[0][mot_xy - mot_stride             ][1];
632
0
            P_TOPRIGHT[0] = s->c.cur_pic.motion_val[0][mot_xy - mot_stride + off[block]][0];
633
0
            P_TOPRIGHT[1] = s->c.cur_pic.motion_val[0][mot_xy - mot_stride + off[block]][1];
634
0
            if (P_TOP[1]      > c->ymax * (1 << shift)) P_TOP[1]      = c->ymax * (1 << shift);
635
0
            if (P_TOPRIGHT[0] < c->xmin * (1 << shift)) P_TOPRIGHT[0] = c->xmin * (1 << shift);
636
0
            if (P_TOPRIGHT[0] > c->xmax * (1 << shift)) P_TOPRIGHT[0] = c->xmax * (1 << shift);
637
0
            if (P_TOPRIGHT[1] > c->ymax * (1 << shift)) P_TOPRIGHT[1] = c->ymax * (1 << shift);
638
639
0
            P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]);
640
0
            P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]);
641
642
0
            c->pred_x= pred_x4 = P_MEDIAN[0];
643
0
            c->pred_y= pred_y4 = P_MEDIAN[1];
644
0
        }
645
0
        P_MV1[0]= mx;
646
0
        P_MV1[1]= my;
647
0
        if(safety_clipping)
648
0
            for(i=1; i<10; i++){
649
0
                if (s->c.first_slice_line && block < 2 && i > 1 && i < 9)
650
0
                    continue;
651
0
                if (i>4 && i<9)
652
0
                    continue;
653
0
                if (P[i][0] > c->xmax * (1 << shift)) P[i][0] = c->xmax * (1 << shift);
654
0
                if (P[i][1] > c->ymax * (1 << shift)) P[i][1] = c->ymax * (1 <<shift );
655
0
            }
656
657
0
        dmin4 = epzs_motion_search2(s, &mx4, &my4, P, block, block, s->p_mv_table, (1<<16)>>shift, 1);
658
659
0
        dmin4= c->sub_motion_search(s, &mx4, &my4, dmin4, block, block, size, h);
660
661
0
        if (c->me_sub_cmp[0] != c->mb_cmp[0]) {
662
0
            int dxy;
663
0
            const int offset= ((block&1) + (block>>1)*stride)*8;
664
0
            uint8_t *dest_y = c->scratchpad + offset;
665
0
            if (s->c.quarter_sample) {
666
0
                const uint8_t *ref = c->ref[block][0] + (mx4>>2) + (my4>>2)*stride;
667
0
                dxy = ((my4 & 3) << 2) | (mx4 & 3);
668
669
0
                c->qpel_put[1][dxy](dest_y, ref, stride);
670
0
            }else{
671
0
                const uint8_t *ref = c->ref[block][0] + (mx4>>1) + (my4>>1)*stride;
672
0
                dxy = ((my4 & 1) << 1) | (mx4 & 1);
673
674
0
                c->hpel_put[1][dxy](dest_y, ref, stride, h);
675
0
            }
676
0
            dmin_sum+= (mv_penalty[mx4-pred_x4] + mv_penalty[my4-pred_y4])*c->mb_penalty_factor;
677
0
        }else
678
0
            dmin_sum+= dmin4;
679
680
0
        if (s->c.quarter_sample) {
681
0
            mx4_sum+= mx4/2;
682
0
            my4_sum+= my4/2;
683
0
        }else{
684
0
            mx4_sum+= mx4;
685
0
            my4_sum+= my4;
686
0
        }
687
688
0
        s->c.cur_pic.motion_val[0][s->c.block_index[block]][0] = mx4;
689
0
        s->c.cur_pic.motion_val[0][s->c.block_index[block]][1] = my4;
690
691
0
        if(mx4 != mx || my4 != my) same=0;
692
0
    }
693
694
0
    if(same)
695
0
        return INT_MAX;
696
697
0
    if (c->me_sub_cmp[0] != c->mb_cmp[0]) {
698
0
        dmin_sum += c->mb_cmp[0](s,
699
0
                                 s->new_pic->data[0] +
700
0
                                 s->c.mb_x * 16 + s->c.mb_y * 16 * stride,
701
0
                                 c->scratchpad, stride, 16);
702
0
    }
703
704
0
    if(c->avctx->mb_cmp&FF_CMP_CHROMA){
705
0
        int dxy;
706
0
        int mx, my;
707
0
        int offset;
708
709
0
        mx= ff_h263_round_chroma(mx4_sum);
710
0
        my= ff_h263_round_chroma(my4_sum);
711
0
        dxy = ((my & 1) << 1) | (mx & 1);
712
713
0
        offset = (s->c.mb_x*8 + (mx>>1)) + (s->c.mb_y*8 + (my>>1))*s->c.uvlinesize;
714
715
0
        c->hpel_put[1][dxy](c->scratchpad    , s->c.last_pic.data[1] + offset, s->c.uvlinesize, 8);
716
0
        c->hpel_put[1][dxy](c->scratchpad + 8, s->c.last_pic.data[2] + offset, s->c.uvlinesize, 8);
717
718
0
        dmin_sum += c->mb_cmp[1](s, s->new_pic->data[1] + s->c.mb_x * 8 + s->c.mb_y * 8 * s->c.uvlinesize, c->scratchpad,     s->c.uvlinesize, 8);
719
0
        dmin_sum += c->mb_cmp[1](s, s->new_pic->data[2] + s->c.mb_x * 8 + s->c.mb_y * 8 * s->c.uvlinesize, c->scratchpad + 8, s->c.uvlinesize, 8);
720
0
    }
721
722
0
    c->pred_x= mx;
723
0
    c->pred_y= my;
724
725
0
    switch(c->avctx->mb_cmp&0xFF){
726
    /*case FF_CMP_SSE:
727
        return dmin_sum+ 32*s->c.qscale*s->c.qscale;*/
728
0
    case FF_CMP_RD:
729
0
        return dmin_sum;
730
0
    default:
731
0
        return dmin_sum+ 11*c->mb_penalty_factor;
732
0
    }
733
0
}
734
735
static inline void init_interlaced_ref(MPVEncContext *const s, int ref_index)
736
0
{
737
0
    MotionEstContext *const c = &s->me;
738
739
0
    c->ref[1+ref_index][0] = c->ref[0+ref_index][0] + s->c.linesize;
740
0
    c->src[1][0] = c->src[0][0] + s->c.linesize;
741
0
    if(c->flags & FLAG_CHROMA){
742
0
        c->ref[1+ref_index][1] = c->ref[0+ref_index][1] + s->c.uvlinesize;
743
0
        c->ref[1+ref_index][2] = c->ref[0+ref_index][2] + s->c.uvlinesize;
744
0
        c->src[1][1] = c->src[0][1] + s->c.uvlinesize;
745
0
        c->src[1][2] = c->src[0][2] + s->c.uvlinesize;
746
0
    }
747
0
}
748
749
static int interlaced_search(MPVEncContext *const s, int ref_index,
750
                             int16_t (*mv_tables[2][2])[2], uint8_t *field_select_tables[2], int mx, int my, int user_field_select)
751
0
{
752
0
    MotionEstContext *const c = &s->me;
753
0
    const int size=0;
754
0
    const int h=8;
755
0
    int block;
756
0
    int P[10][2];
757
0
    const uint8_t * const mv_penalty = c->current_mv_penalty;
758
0
    int same=1;
759
0
    const int stride = 2*s->c.linesize;
760
0
    int dmin_sum= 0;
761
0
    const int mot_stride = s->c.mb_stride;
762
0
    const int xy = s->c.mb_x + s->c.mb_y*mot_stride;
763
764
0
    c->ymin>>=1;
765
0
    c->ymax>>=1;
766
0
    c->stride<<=1;
767
0
    c->uvstride<<=1;
768
0
    init_interlaced_ref(s, ref_index);
769
770
0
    for(block=0; block<2; block++){
771
0
        int field_select;
772
0
        int best_dmin= INT_MAX;
773
0
        int best_field= -1;
774
775
0
        for(field_select=0; field_select<2; field_select++){
776
0
            int dmin, mx_i, my_i;
777
0
            int16_t (*mv_table)[2]= mv_tables[block][field_select];
778
779
0
            if(user_field_select){
780
0
                av_assert1(field_select==0 || field_select==1);
781
0
                av_assert1(field_select_tables[block][xy]==0 || field_select_tables[block][xy]==1);
782
0
                if(field_select_tables[block][xy] != field_select)
783
0
                    continue;
784
0
            }
785
786
0
            P_LEFT[0] = mv_table[xy - 1][0];
787
0
            P_LEFT[1] = mv_table[xy - 1][1];
788
0
            if(P_LEFT[0]       > (c->xmax<<1)) P_LEFT[0]       = (c->xmax<<1);
789
790
0
            c->pred_x= P_LEFT[0];
791
0
            c->pred_y= P_LEFT[1];
792
793
0
            if (!s->c.first_slice_line) {
794
0
                P_TOP[0]      = mv_table[xy - mot_stride][0];
795
0
                P_TOP[1]      = mv_table[xy - mot_stride][1];
796
0
                P_TOPRIGHT[0] = mv_table[xy - mot_stride + 1][0];
797
0
                P_TOPRIGHT[1] = mv_table[xy - mot_stride + 1][1];
798
0
                if(P_TOP[1]      > (c->ymax<<1)) P_TOP[1]     = (c->ymax<<1);
799
0
                if (P_TOPRIGHT[0] < c->xmin * (1 << 1)) P_TOPRIGHT[0] = c->xmin * (1 << 1);
800
0
                if(P_TOPRIGHT[0] > (c->xmax<<1)) P_TOPRIGHT[0]= (c->xmax<<1);
801
0
                if(P_TOPRIGHT[1] > (c->ymax<<1)) P_TOPRIGHT[1]= (c->ymax<<1);
802
803
0
                P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]);
804
0
                P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]);
805
0
            }
806
0
            P_MV1[0]= mx; //FIXME not correct if block != field_select
807
0
            P_MV1[1]= my / 2;
808
809
0
            dmin = epzs_motion_search2(s, &mx_i, &my_i, P, block, field_select+ref_index, mv_table, (1<<16)>>1, 0);
810
811
0
            dmin= c->sub_motion_search(s, &mx_i, &my_i, dmin, block, field_select+ref_index, size, h);
812
813
0
            mv_table[xy][0]= mx_i;
814
0
            mv_table[xy][1]= my_i;
815
816
0
            if (c->me_sub_cmp[0] != c->mb_cmp[0]) {
817
0
                int dxy;
818
819
                //FIXME chroma ME
820
0
                const uint8_t *ref = c->ref[field_select+ref_index][0] + (mx_i>>1) + (my_i>>1)*stride;
821
0
                dxy = ((my_i & 1) << 1) | (mx_i & 1);
822
823
0
                c->hpel_put[size][dxy](c->scratchpad, ref, stride, h);
824
0
                dmin = c->mb_cmp[size](s, c->src[block][0], c->scratchpad, stride, h);
825
0
                dmin+= (mv_penalty[mx_i-c->pred_x] + mv_penalty[my_i-c->pred_y] + 1)*c->mb_penalty_factor;
826
0
            }else
827
0
                dmin+= c->mb_penalty_factor; //field_select bits
828
829
0
            dmin += field_select != block; //slightly prefer same field
830
831
0
            if(dmin < best_dmin){
832
0
                best_dmin= dmin;
833
0
                best_field= field_select;
834
0
            }
835
0
        }
836
0
        {
837
0
            int16_t (*mv_table)[2]= mv_tables[block][best_field];
838
839
0
            if(mv_table[xy][0] != mx) same=0; //FIXME check if these checks work and are any good at all
840
0
            if(mv_table[xy][1]&1) same=0;
841
0
            if(mv_table[xy][1]*2 != my) same=0;
842
0
            if(best_field != block) same=0;
843
0
        }
844
845
0
        field_select_tables[block][xy]= best_field;
846
0
        dmin_sum += best_dmin;
847
0
    }
848
849
0
    c->ymin *= 2;
850
0
    c->ymax<<=1;
851
0
    c->stride>>=1;
852
0
    c->uvstride>>=1;
853
854
0
    if(same)
855
0
        return INT_MAX;
856
857
0
    switch(c->avctx->mb_cmp&0xFF){
858
    /*case FF_CMP_SSE:
859
        return dmin_sum+ 32*s->c.qscale*s->c.qscale;*/
860
0
    case FF_CMP_RD:
861
0
        return dmin_sum;
862
0
    default:
863
0
        return dmin_sum+ 11*c->mb_penalty_factor;
864
0
    }
865
0
}
866
867
1.14M
static inline int get_penalty_factor(int lambda, int lambda2, int type){
868
1.14M
    switch(type&0xFF){
869
0
    default:
870
1.14M
    case FF_CMP_SAD:
871
1.14M
        return lambda>>FF_LAMBDA_SHIFT;
872
0
    case FF_CMP_DCT:
873
0
        return (3*lambda)>>(FF_LAMBDA_SHIFT+1);
874
0
    case FF_CMP_W53:
875
0
        return (4*lambda)>>(FF_LAMBDA_SHIFT);
876
0
    case FF_CMP_W97:
877
0
        return (2*lambda)>>(FF_LAMBDA_SHIFT);
878
0
    case FF_CMP_SATD:
879
0
    case FF_CMP_DCT264:
880
0
        return (2*lambda)>>FF_LAMBDA_SHIFT;
881
0
    case FF_CMP_RD:
882
0
    case FF_CMP_PSNR:
883
0
    case FF_CMP_SSE:
884
0
    case FF_CMP_NSSE:
885
0
        return lambda2>>FF_LAMBDA_SHIFT;
886
0
    case FF_CMP_BIT:
887
0
    case FF_CMP_MEDIAN_SAD:
888
0
        return 1;
889
1.14M
    }
890
1.14M
}
891
892
void ff_estimate_p_frame_motion(MPVEncContext *const s,
893
                                int mb_x, int mb_y)
894
381k
{
895
381k
    MotionEstContext *const c = &s->me;
896
381k
    const uint8_t *pix, *ppix;
897
381k
    int sum, mx = 0, my = 0, dmin = 0;
898
381k
    int varc;            ///< the variance of the block (sum of squared (p[y][x]-average))
899
381k
    int vard;            ///< sum of squared differences with the estimated motion vector
900
381k
    int P[10][2];
901
381k
    const int shift = 1 + s->c.quarter_sample;
902
381k
    int mb_type=0;
903
904
381k
    init_ref(c, s->new_pic->data, s->c.last_pic.data, NULL, 16*mb_x, 16*mb_y, 0);
905
906
381k
    av_assert0(s->c.quarter_sample == 0 || s->c.quarter_sample == 1);
907
381k
    av_assert0(s->c.linesize == c->stride);
908
381k
    av_assert0(s->c.uvlinesize == c->uvstride);
909
910
381k
    c->penalty_factor     = get_penalty_factor(s->lambda, s->lambda2, c->avctx->me_cmp);
911
381k
    c->sub_penalty_factor = get_penalty_factor(s->lambda, s->lambda2, c->avctx->me_sub_cmp);
912
381k
    c->mb_penalty_factor  = get_penalty_factor(s->lambda, s->lambda2, c->avctx->mb_cmp);
913
381k
    c->current_mv_penalty = c->mv_penalty[s->f_code] + MAX_DMV;
914
915
381k
    get_limits(s, 16*mb_x, 16*mb_y, 0);
916
381k
    c->skip=0;
917
918
    /* intra / predictive decision */
919
381k
    pix = c->src[0][0];
920
381k
    sum  = s->mpvencdsp.pix_sum(pix, s->c.linesize);
921
381k
    varc = s->mpvencdsp.pix_norm1(pix, s->c.linesize) -
922
381k
           (((unsigned) sum * sum) >> 8) + 500;
923
924
381k
    s->mb_mean[s->c.mb_stride * mb_y + mb_x] = (sum  + 128) >> 8;
925
381k
    s->mb_var [s->c.mb_stride * mb_y + mb_x] = (varc + 128) >> 8;
926
381k
    c->mb_var_sum_temp += (varc+128)>>8;
927
928
381k
    if (c->motion_est != FF_ME_ZERO) {
929
381k
        const int mot_stride = s->c.b8_stride;
930
381k
        const int mot_xy = s->c.block_index[0];
931
932
381k
        P_LEFT[0] = s->c.cur_pic.motion_val[0][mot_xy - 1][0];
933
381k
        P_LEFT[1] = s->c.cur_pic.motion_val[0][mot_xy - 1][1];
934
935
381k
        if (P_LEFT[0] > (c->xmax << shift))
936
16.3k
            P_LEFT[0] =  c->xmax << shift;
937
938
381k
        if (!s->c.first_slice_line) {
939
218k
            P_TOP[0]      = s->c.cur_pic.motion_val[0][mot_xy - mot_stride    ][0];
940
218k
            P_TOP[1]      = s->c.cur_pic.motion_val[0][mot_xy - mot_stride    ][1];
941
218k
            P_TOPRIGHT[0] = s->c.cur_pic.motion_val[0][mot_xy - mot_stride + 2][0];
942
218k
            P_TOPRIGHT[1] = s->c.cur_pic.motion_val[0][mot_xy - mot_stride + 2][1];
943
218k
            if (P_TOP[1] > (c->ymax << shift))
944
45.3k
                P_TOP[1] =  c->ymax << shift;
945
218k
            if (P_TOPRIGHT[0] < (c->xmin * (1 << shift)))
946
13.4k
                P_TOPRIGHT[0] =  c->xmin * (1 << shift);
947
218k
            if (P_TOPRIGHT[1] > (c->ymax * (1 << shift)))
948
39.3k
                P_TOPRIGHT[1] =  c->ymax * (1 << shift);
949
950
218k
            P_MEDIAN[0] = mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]);
951
218k
            P_MEDIAN[1] = mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]);
952
953
218k
            if (s->c.out_format == FMT_H263) {
954
0
                c->pred_x = P_MEDIAN[0];
955
0
                c->pred_y = P_MEDIAN[1];
956
218k
            } else { /* MPEG-1 at least */
957
218k
                c->pred_x = P_LEFT[0];
958
218k
                c->pred_y = P_LEFT[1];
959
218k
            }
960
218k
        } else {
961
163k
            c->pred_x = P_LEFT[0];
962
163k
            c->pred_y = P_LEFT[1];
963
163k
        }
964
381k
        dmin = ff_epzs_motion_search(s, &mx, &my, P, 0, 0, s->p_mv_table, (1<<16)>>shift, 0, 16);
965
381k
    }
966
967
    /* At this point (mx,my) are full-pell and the relative displacement */
968
381k
    ppix = c->ref[0][0] + (my * s->c.linesize) + mx;
969
970
381k
    vard = c->sse(NULL, pix, ppix, s->c.linesize, 16);
971
972
381k
    s->mc_mb_var[s->c.mb_stride * mb_y + mb_x] = (vard+128)>>8;
973
381k
    c->mc_mb_var_sum_temp += (vard+128)>>8;
974
975
381k
    if (c->avctx->mb_decision > FF_MB_DECISION_SIMPLE) {
976
0
        int p_score = FFMIN(vard, varc - 500 + (s->lambda2 >> FF_LAMBDA_SHIFT)*100);
977
0
        int i_score = varc - 500 + (s->lambda2 >> FF_LAMBDA_SHIFT)*20;
978
0
        c->scene_change_score+= ff_sqrt(p_score) - ff_sqrt(i_score);
979
980
0
        if (vard*2 + 200*256 > varc && !s->intra_penalty)
981
0
            mb_type|= CANDIDATE_MB_TYPE_INTRA;
982
0
        if (varc*2 + 200*256 > vard || s->c.qscale > 24){
983
//        if (varc*2 + 200*256 + 50*(s->lambda2>>FF_LAMBDA_SHIFT) > vard){
984
0
            mb_type|= CANDIDATE_MB_TYPE_INTER;
985
0
            c->sub_motion_search(s, &mx, &my, dmin, 0, 0, 0, 16);
986
0
            if (s->mpv_flags & FF_MPV_FLAG_MV0)
987
0
                if(mx || my)
988
0
                    mb_type |= CANDIDATE_MB_TYPE_SKIPPED; //FIXME check difference
989
0
        }else{
990
0
            mx *= 1 << shift;
991
0
            my *= 1 << shift;
992
0
        }
993
0
        if ((c->avctx->flags & AV_CODEC_FLAG_4MV)
994
0
           && !c->skip && varc>50<<8 && vard>10<<8){
995
0
            if(h263_mv4_search(s, mx, my, shift) < INT_MAX)
996
0
                mb_type|=CANDIDATE_MB_TYPE_INTER4V;
997
998
0
            set_p_mv_tables(s, mx, my, 0);
999
0
        }else
1000
0
            set_p_mv_tables(s, mx, my, 1);
1001
0
        if ((c->avctx->flags & AV_CODEC_FLAG_INTERLACED_ME)
1002
0
           && !c->skip){ //FIXME varc/d checks
1003
0
            if(interlaced_search(s, 0, s->c.p_field_mv_table, s->p_field_select_table, mx, my, 0) < INT_MAX)
1004
0
                mb_type |= CANDIDATE_MB_TYPE_INTER_I;
1005
0
        }
1006
381k
    }else{
1007
381k
        int intra_score, i;
1008
381k
        mb_type= CANDIDATE_MB_TYPE_INTER;
1009
1010
381k
        dmin= c->sub_motion_search(s, &mx, &my, dmin, 0, 0, 0, 16);
1011
381k
        if(c->avctx->me_sub_cmp != c->avctx->mb_cmp && !c->skip)
1012
0
            dmin= get_mb_score(s, mx, my, 0, 0, 0, 16, 1);
1013
1014
381k
        if ((c->avctx->flags & AV_CODEC_FLAG_4MV)
1015
0
           && !c->skip && varc>50<<8 && vard>10<<8){
1016
0
            int dmin4= h263_mv4_search(s, mx, my, shift);
1017
0
            if(dmin4 < dmin){
1018
0
                mb_type= CANDIDATE_MB_TYPE_INTER4V;
1019
0
                dmin=dmin4;
1020
0
            }
1021
0
        }
1022
381k
        if ((c->avctx->flags & AV_CODEC_FLAG_INTERLACED_ME)
1023
0
           && !c->skip){ //FIXME varc/d checks
1024
0
            int dmin_i= interlaced_search(s, 0, s->c.p_field_mv_table, s->p_field_select_table, mx, my, 0);
1025
0
            if(dmin_i < dmin){
1026
0
                mb_type = CANDIDATE_MB_TYPE_INTER_I;
1027
0
                dmin= dmin_i;
1028
0
            }
1029
0
        }
1030
1031
381k
        set_p_mv_tables(s, mx, my, mb_type!=CANDIDATE_MB_TYPE_INTER4V);
1032
1033
        /* get intra luma score */
1034
381k
        if((c->avctx->mb_cmp&0xFF)==FF_CMP_SSE){
1035
0
            intra_score= varc - 500;
1036
381k
        }else{
1037
381k
            unsigned mean = (sum+128)>>8;
1038
381k
            mean*= 0x01010101;
1039
1040
6.49M
            for(i=0; i<16; i++){
1041
6.10M
                *(uint32_t*)(&c->scratchpad[i*s->c.linesize+ 0]) = mean;
1042
6.10M
                *(uint32_t*)(&c->scratchpad[i*s->c.linesize+ 4]) = mean;
1043
6.10M
                *(uint32_t*)(&c->scratchpad[i*s->c.linesize+ 8]) = mean;
1044
6.10M
                *(uint32_t*)(&c->scratchpad[i*s->c.linesize+12]) = mean;
1045
6.10M
            }
1046
1047
381k
            intra_score= c->mb_cmp[0](s, c->scratchpad, pix, s->c.linesize, 16);
1048
381k
        }
1049
381k
        intra_score += c->mb_penalty_factor*16 + s->intra_penalty;
1050
1051
381k
        if(intra_score < dmin){
1052
185k
            mb_type= CANDIDATE_MB_TYPE_INTRA;
1053
185k
            s->c.cur_pic.mb_type[mb_y*s->c.mb_stride + mb_x] = CANDIDATE_MB_TYPE_INTRA; //FIXME cleanup
1054
185k
        }else
1055
196k
            s->c.cur_pic.mb_type[mb_y*s->c.mb_stride + mb_x] = 0;
1056
1057
381k
        {
1058
381k
            int p_score = FFMIN(vard, varc-500+(s->lambda2>>FF_LAMBDA_SHIFT)*100);
1059
381k
            int i_score = varc-500+(s->lambda2>>FF_LAMBDA_SHIFT)*20;
1060
381k
            c->scene_change_score+= ff_sqrt(p_score) - ff_sqrt(i_score);
1061
381k
        }
1062
381k
    }
1063
1064
381k
    s->mb_type[mb_y*s->c.mb_stride + mb_x] = mb_type;
1065
381k
}
1066
1067
int ff_pre_estimate_p_frame_motion(MPVEncContext *const s,
1068
                                    int mb_x, int mb_y)
1069
0
{
1070
0
    MotionEstContext *const c = &s->me;
1071
0
    int mx, my, dmin;
1072
0
    int P[10][2];
1073
0
    const int shift = 1 + s->c.quarter_sample;
1074
0
    const int xy    = mb_x + mb_y*s->c.mb_stride;
1075
0
    init_ref(c, s->new_pic->data, s->c.last_pic.data, NULL, 16*mb_x, 16*mb_y, 0);
1076
1077
0
    av_assert0(s->c.quarter_sample == 0 || s->c.quarter_sample == 1);
1078
1079
0
    c->pre_penalty_factor = get_penalty_factor(s->lambda, s->lambda2, c->avctx->me_pre_cmp);
1080
0
    c->current_mv_penalty = c->mv_penalty[s->f_code] + MAX_DMV;
1081
1082
0
    get_limits(s, 16*mb_x, 16*mb_y, 0);
1083
0
    c->skip=0;
1084
1085
0
    P_LEFT[0]       = s->p_mv_table[xy + 1][0];
1086
0
    P_LEFT[1]       = s->p_mv_table[xy + 1][1];
1087
1088
0
    if(P_LEFT[0]       < (c->xmin<<shift)) P_LEFT[0]       = (c->xmin<<shift);
1089
1090
    /* special case for first line */
1091
0
    if (s->c.first_slice_line) {
1092
0
        c->pred_x= P_LEFT[0];
1093
0
        c->pred_y= P_LEFT[1];
1094
0
        P_TOP[0]= P_TOPRIGHT[0]= P_MEDIAN[0]=
1095
0
        P_TOP[1]= P_TOPRIGHT[1]= P_MEDIAN[1]= 0; //FIXME
1096
0
    } else {
1097
0
        P_TOP[0]      = s->p_mv_table[xy + s->c.mb_stride    ][0];
1098
0
        P_TOP[1]      = s->p_mv_table[xy + s->c.mb_stride    ][1];
1099
0
        P_TOPRIGHT[0] = s->p_mv_table[xy + s->c.mb_stride - 1][0];
1100
0
        P_TOPRIGHT[1] = s->p_mv_table[xy + s->c.mb_stride - 1][1];
1101
0
        if(P_TOP[1]      < (c->ymin<<shift)) P_TOP[1]     = (c->ymin<<shift);
1102
0
        if(P_TOPRIGHT[0] > (c->xmax<<shift)) P_TOPRIGHT[0]= (c->xmax<<shift);
1103
0
        if(P_TOPRIGHT[1] < (c->ymin<<shift)) P_TOPRIGHT[1]= (c->ymin<<shift);
1104
1105
0
        P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]);
1106
0
        P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]);
1107
1108
0
        c->pred_x = P_MEDIAN[0];
1109
0
        c->pred_y = P_MEDIAN[1];
1110
0
    }
1111
1112
0
    dmin = ff_epzs_motion_search(s, &mx, &my, P, 0, 0, s->p_mv_table, (1<<16)>>shift, 0, 16);
1113
1114
0
    s->p_mv_table[xy][0] = mx<<shift;
1115
0
    s->p_mv_table[xy][1] = my<<shift;
1116
1117
0
    return dmin;
1118
0
}
1119
1120
static int estimate_motion_b(MPVEncContext *const s, int mb_x, int mb_y,
1121
                             int16_t (*mv_table)[2], int ref_index, int f_code)
1122
0
{
1123
0
    MotionEstContext *const c = &s->me;
1124
0
    int mx = 0, my = 0, dmin = 0;
1125
0
    int P[10][2];
1126
0
    const int shift= 1+s->c.quarter_sample;
1127
0
    const int mot_stride = s->c.mb_stride;
1128
0
    const int mot_xy = mb_y*mot_stride + mb_x;
1129
0
    const uint8_t * const mv_penalty = c->mv_penalty[f_code] + MAX_DMV;
1130
0
    int mv_scale;
1131
1132
0
    c->current_mv_penalty= mv_penalty;
1133
1134
0
    get_limits(s, 16*mb_x, 16*mb_y, 1);
1135
1136
0
    if (c->motion_est != FF_ME_ZERO) {
1137
0
        P_LEFT[0] = mv_table[mot_xy - 1][0];
1138
0
        P_LEFT[1] = mv_table[mot_xy - 1][1];
1139
1140
0
        if (P_LEFT[0] > (c->xmax << shift)) P_LEFT[0] = (c->xmax << shift);
1141
1142
        /* special case for first line */
1143
0
        if (!s->c.first_slice_line) {
1144
0
            P_TOP[0]      = mv_table[mot_xy - mot_stride    ][0];
1145
0
            P_TOP[1]      = mv_table[mot_xy - mot_stride    ][1];
1146
0
            P_TOPRIGHT[0] = mv_table[mot_xy - mot_stride + 1][0];
1147
0
            P_TOPRIGHT[1] = mv_table[mot_xy - mot_stride + 1][1];
1148
0
            if (P_TOP[1] > (c->ymax << shift)) P_TOP[1] = (c->ymax << shift);
1149
0
            if (P_TOPRIGHT[0] < c->xmin * (1 << shift)) P_TOPRIGHT[0] = c->xmin * (1 << shift);
1150
0
            if (P_TOPRIGHT[1] > (c->ymax << shift)) P_TOPRIGHT[1] = (c->ymax << shift);
1151
1152
0
            P_MEDIAN[0] = mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]);
1153
0
            P_MEDIAN[1] = mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]);
1154
0
        }
1155
0
        c->pred_x = P_LEFT[0];
1156
0
        c->pred_y = P_LEFT[1];
1157
1158
0
        if(mv_table == s->b_forw_mv_table){
1159
0
            mv_scale= (s->c.pb_time<<16) / (s->c.pp_time<<shift);
1160
0
        }else{
1161
0
            mv_scale = ((s->c.pb_time - s->c.pp_time) * (1 << 16)) / (s->c.pp_time<<shift);
1162
0
        }
1163
1164
0
        dmin = ff_epzs_motion_search(s, &mx, &my, P, 0, ref_index, s->p_mv_table, mv_scale, 0, 16);
1165
0
    }
1166
1167
0
    dmin= c->sub_motion_search(s, &mx, &my, dmin, 0, ref_index, 0, 16);
1168
1169
0
    if(c->avctx->me_sub_cmp != c->avctx->mb_cmp && !c->skip)
1170
0
        dmin= get_mb_score(s, mx, my, 0, ref_index, 0, 16, 1);
1171
1172
//    s->mb_type[mb_y*s->c.mb_width + mb_x]= mb_type;
1173
0
    mv_table[mot_xy][0]= mx;
1174
0
    mv_table[mot_xy][1]= my;
1175
1176
0
    return dmin;
1177
0
}
1178
1179
static inline int check_bidir_mv(MPVEncContext *const s,
1180
                   int motion_fx, int motion_fy,
1181
                   int motion_bx, int motion_by,
1182
                   int pred_fx, int pred_fy,
1183
                   int pred_bx, int pred_by,
1184
                   int size, int h)
1185
0
{
1186
    //FIXME optimize?
1187
    //FIXME better f_code prediction (max mv & distance)
1188
    //FIXME pointers
1189
0
    MotionEstContext *const c = &s->me;
1190
0
    const uint8_t * const mv_penalty_f = c->mv_penalty[s->f_code] + MAX_DMV; // f_code of the prev frame
1191
0
    const uint8_t * const mv_penalty_b = c->mv_penalty[s->b_code] + MAX_DMV; // f_code of the prev frame
1192
0
    int stride= c->stride;
1193
0
    uint8_t *dest_y = c->scratchpad;
1194
0
    const uint8_t *ptr;
1195
0
    int dxy;
1196
0
    int src_x, src_y;
1197
0
    int fbmin;
1198
0
    const uint8_t *const *src_data  = c->src[0];
1199
0
    const uint8_t *const *ref_data  = c->ref[0];
1200
0
    const uint8_t *const *ref2_data = c->ref[2];
1201
1202
0
    if(s->c.quarter_sample){
1203
0
        dxy = ((motion_fy & 3) << 2) | (motion_fx & 3);
1204
0
        src_x = motion_fx >> 2;
1205
0
        src_y = motion_fy >> 2;
1206
1207
0
        ptr = ref_data[0] + (src_y * stride) + src_x;
1208
0
        s->c.qdsp.put_qpel_pixels_tab[0][dxy](dest_y, ptr, stride);
1209
1210
0
        dxy = ((motion_by & 3) << 2) | (motion_bx & 3);
1211
0
        src_x = motion_bx >> 2;
1212
0
        src_y = motion_by >> 2;
1213
1214
0
        ptr = ref2_data[0] + (src_y * stride) + src_x;
1215
0
        s->c.qdsp.avg_qpel_pixels_tab[size][dxy](dest_y, ptr, stride);
1216
0
    }else{
1217
0
        dxy = ((motion_fy & 1) << 1) | (motion_fx & 1);
1218
0
        src_x = motion_fx >> 1;
1219
0
        src_y = motion_fy >> 1;
1220
1221
0
        ptr = ref_data[0] + (src_y * stride) + src_x;
1222
0
        s->c.hdsp.put_pixels_tab[size][dxy](dest_y    , ptr    , stride, h);
1223
1224
0
        dxy = ((motion_by & 1) << 1) | (motion_bx & 1);
1225
0
        src_x = motion_bx >> 1;
1226
0
        src_y = motion_by >> 1;
1227
1228
0
        ptr = ref2_data[0] + (src_y * stride) + src_x;
1229
0
        s->c.hdsp.avg_pixels_tab[size][dxy](dest_y    , ptr    , stride, h);
1230
0
    }
1231
1232
0
    fbmin = (mv_penalty_f[motion_fx-pred_fx] + mv_penalty_f[motion_fy-pred_fy])*c->mb_penalty_factor
1233
0
           +(mv_penalty_b[motion_bx-pred_bx] + mv_penalty_b[motion_by-pred_by])*c->mb_penalty_factor
1234
0
           + c->mb_cmp[size](s, src_data[0], dest_y, stride, h); // FIXME new_pic
1235
1236
0
    if(c->avctx->mb_cmp&FF_CMP_CHROMA){
1237
0
    }
1238
    //FIXME CHROMA !!!
1239
1240
0
    return fbmin;
1241
0
}
1242
1243
/* refine the bidir vectors in hq mode and return the score in both lq & hq mode*/
1244
static inline int bidir_refine(MPVEncContext *const s, int mb_x, int mb_y)
1245
0
{
1246
0
    MotionEstContext *const c = &s->me;
1247
0
    const int mot_stride = s->c.mb_stride;
1248
0
    const int xy = mb_y *mot_stride + mb_x;
1249
0
    int fbmin;
1250
0
    int pred_fx= s->b_bidir_forw_mv_table[xy-1][0];
1251
0
    int pred_fy= s->b_bidir_forw_mv_table[xy-1][1];
1252
0
    int pred_bx= s->b_bidir_back_mv_table[xy-1][0];
1253
0
    int pred_by= s->b_bidir_back_mv_table[xy-1][1];
1254
0
    int motion_fx= s->b_bidir_forw_mv_table[xy][0]= s->b_forw_mv_table[xy][0];
1255
0
    int motion_fy= s->b_bidir_forw_mv_table[xy][1]= s->b_forw_mv_table[xy][1];
1256
0
    int motion_bx= s->b_bidir_back_mv_table[xy][0]= s->b_back_mv_table[xy][0];
1257
0
    int motion_by= s->b_bidir_back_mv_table[xy][1]= s->b_back_mv_table[xy][1];
1258
0
    const int flags= c->sub_flags;
1259
0
    const int qpel= flags&FLAG_QPEL;
1260
0
    const int shift= 1+qpel;
1261
0
    const int xmin= c->xmin * (1 << shift);
1262
0
    const int ymin= c->ymin * (1 << shift);
1263
0
    const int xmax= c->xmax<<shift;
1264
0
    const int ymax= c->ymax<<shift;
1265
0
#define HASH(fx,fy,bx,by) ((fx)+17*(fy)+63*(bx)+117*(by))
1266
0
#define HASH8(fx,fy,bx,by) ((uint8_t)HASH(fx,fy,bx,by))
1267
0
    int hashidx= HASH(motion_fx,motion_fy, motion_bx, motion_by);
1268
0
    uint8_t map[256] = { 0 };
1269
1270
0
    map[hashidx&255] = 1;
1271
1272
0
    fbmin= check_bidir_mv(s, motion_fx, motion_fy,
1273
0
                          motion_bx, motion_by,
1274
0
                          pred_fx, pred_fy,
1275
0
                          pred_bx, pred_by,
1276
0
                          0, 16);
1277
1278
0
    if (c->avctx->bidir_refine) {
1279
0
        int end;
1280
0
        static const uint8_t limittab[5]={0,8,32,64,80};
1281
0
        const int limit = limittab[c->avctx->bidir_refine];
1282
0
        static const int8_t vect[][4]={
1283
0
{ 0, 0, 0, 1}, { 0, 0, 0,-1}, { 0, 0, 1, 0}, { 0, 0,-1, 0}, { 0, 1, 0, 0}, { 0,-1, 0, 0}, { 1, 0, 0, 0}, {-1, 0, 0, 0},
1284
1285
0
{ 0, 0, 1, 1}, { 0, 0,-1,-1}, { 0, 1, 1, 0}, { 0,-1,-1, 0}, { 1, 1, 0, 0}, {-1,-1, 0, 0}, { 1, 0, 0, 1}, {-1, 0, 0,-1},
1286
0
{ 0, 1, 0, 1}, { 0,-1, 0,-1}, { 1, 0, 1, 0}, {-1, 0,-1, 0},
1287
0
{ 0, 0,-1, 1}, { 0, 0, 1,-1}, { 0,-1, 1, 0}, { 0, 1,-1, 0}, {-1, 1, 0, 0}, { 1,-1, 0, 0}, { 1, 0, 0,-1}, {-1, 0, 0, 1},
1288
0
{ 0,-1, 0, 1}, { 0, 1, 0,-1}, {-1, 0, 1, 0}, { 1, 0,-1, 0},
1289
1290
0
{ 0, 1, 1, 1}, { 0,-1,-1,-1}, { 1, 1, 1, 0}, {-1,-1,-1, 0}, { 1, 1, 0, 1}, {-1,-1, 0,-1}, { 1, 0, 1, 1}, {-1, 0,-1,-1},
1291
0
{ 0,-1, 1, 1}, { 0, 1,-1,-1}, {-1, 1, 1, 0}, { 1,-1,-1, 0}, { 1, 1, 0,-1}, {-1,-1, 0, 1}, { 1, 0,-1, 1}, {-1, 0, 1,-1},
1292
0
{ 0, 1,-1, 1}, { 0,-1, 1,-1}, { 1,-1, 1, 0}, {-1, 1,-1, 0}, {-1, 1, 0, 1}, { 1,-1, 0,-1}, { 1, 0, 1,-1}, {-1, 0,-1, 1},
1293
0
{ 0, 1, 1,-1}, { 0,-1,-1, 1}, { 1, 1,-1, 0}, {-1,-1, 1, 0}, { 1,-1, 0, 1}, {-1, 1, 0,-1}, {-1, 0, 1, 1}, { 1, 0,-1,-1},
1294
1295
0
{ 1, 1, 1, 1}, {-1,-1,-1,-1},
1296
0
{ 1, 1, 1,-1}, {-1,-1,-1, 1}, { 1, 1,-1, 1}, {-1,-1, 1,-1}, { 1,-1, 1, 1}, {-1, 1,-1,-1}, {-1, 1, 1, 1}, { 1,-1,-1,-1},
1297
0
{ 1, 1,-1,-1}, {-1,-1, 1, 1}, { 1,-1,-1, 1}, {-1, 1, 1,-1}, { 1,-1, 1,-1}, {-1, 1,-1, 1},
1298
0
        };
1299
0
        static const uint8_t hash[]={
1300
0
HASH8( 0, 0, 0, 1), HASH8( 0, 0, 0,-1), HASH8( 0, 0, 1, 0), HASH8( 0, 0,-1, 0), HASH8( 0, 1, 0, 0), HASH8( 0,-1, 0, 0), HASH8( 1, 0, 0, 0), HASH8(-1, 0, 0, 0),
1301
1302
0
HASH8( 0, 0, 1, 1), HASH8( 0, 0,-1,-1), HASH8( 0, 1, 1, 0), HASH8( 0,-1,-1, 0), HASH8( 1, 1, 0, 0), HASH8(-1,-1, 0, 0), HASH8( 1, 0, 0, 1), HASH8(-1, 0, 0,-1),
1303
0
HASH8( 0, 1, 0, 1), HASH8( 0,-1, 0,-1), HASH8( 1, 0, 1, 0), HASH8(-1, 0,-1, 0),
1304
0
HASH8( 0, 0,-1, 1), HASH8( 0, 0, 1,-1), HASH8( 0,-1, 1, 0), HASH8( 0, 1,-1, 0), HASH8(-1, 1, 0, 0), HASH8( 1,-1, 0, 0), HASH8( 1, 0, 0,-1), HASH8(-1, 0, 0, 1),
1305
0
HASH8( 0,-1, 0, 1), HASH8( 0, 1, 0,-1), HASH8(-1, 0, 1, 0), HASH8( 1, 0,-1, 0),
1306
1307
0
HASH8( 0, 1, 1, 1), HASH8( 0,-1,-1,-1), HASH8( 1, 1, 1, 0), HASH8(-1,-1,-1, 0), HASH8( 1, 1, 0, 1), HASH8(-1,-1, 0,-1), HASH8( 1, 0, 1, 1), HASH8(-1, 0,-1,-1),
1308
0
HASH8( 0,-1, 1, 1), HASH8( 0, 1,-1,-1), HASH8(-1, 1, 1, 0), HASH8( 1,-1,-1, 0), HASH8( 1, 1, 0,-1), HASH8(-1,-1, 0, 1), HASH8( 1, 0,-1, 1), HASH8(-1, 0, 1,-1),
1309
0
HASH8( 0, 1,-1, 1), HASH8( 0,-1, 1,-1), HASH8( 1,-1, 1, 0), HASH8(-1, 1,-1, 0), HASH8(-1, 1, 0, 1), HASH8( 1,-1, 0,-1), HASH8( 1, 0, 1,-1), HASH8(-1, 0,-1, 1),
1310
0
HASH8( 0, 1, 1,-1), HASH8( 0,-1,-1, 1), HASH8( 1, 1,-1, 0), HASH8(-1,-1, 1, 0), HASH8( 1,-1, 0, 1), HASH8(-1, 1, 0,-1), HASH8(-1, 0, 1, 1), HASH8( 1, 0,-1,-1),
1311
1312
0
HASH8( 1, 1, 1, 1), HASH8(-1,-1,-1,-1),
1313
0
HASH8( 1, 1, 1,-1), HASH8(-1,-1,-1, 1), HASH8( 1, 1,-1, 1), HASH8(-1,-1, 1,-1), HASH8( 1,-1, 1, 1), HASH8(-1, 1,-1,-1), HASH8(-1, 1, 1, 1), HASH8( 1,-1,-1,-1),
1314
0
HASH8( 1, 1,-1,-1), HASH8(-1,-1, 1, 1), HASH8( 1,-1,-1, 1), HASH8(-1, 1, 1,-1), HASH8( 1,-1, 1,-1), HASH8(-1, 1,-1, 1),
1315
0
};
1316
1317
0
#define CHECK_BIDIR(fx,fy,bx,by)\
1318
0
    if( !map[(hashidx+HASH(fx,fy,bx,by))&255]\
1319
0
       &&(fx<=0 || motion_fx+fx<=xmax) && (fy<=0 || motion_fy+fy<=ymax) && (bx<=0 || motion_bx+bx<=xmax) && (by<=0 || motion_by+by<=ymax)\
1320
0
       &&(fx>=0 || motion_fx+fx>=xmin) && (fy>=0 || motion_fy+fy>=ymin) && (bx>=0 || motion_bx+bx>=xmin) && (by>=0 || motion_by+by>=ymin)){\
1321
0
        int score;\
1322
0
        map[(hashidx+HASH(fx,fy,bx,by))&255] = 1;\
1323
0
        score= check_bidir_mv(s, motion_fx+fx, motion_fy+fy, motion_bx+bx, motion_by+by, pred_fx, pred_fy, pred_bx, pred_by, 0, 16);\
1324
0
        if(score < fbmin){\
1325
0
            hashidx += HASH(fx,fy,bx,by);\
1326
0
            fbmin= score;\
1327
0
            motion_fx+=fx;\
1328
0
            motion_fy+=fy;\
1329
0
            motion_bx+=bx;\
1330
0
            motion_by+=by;\
1331
0
            end=0;\
1332
0
        }\
1333
0
    }
1334
0
#define CHECK_BIDIR2(a,b,c,d)\
1335
0
CHECK_BIDIR(a,b,c,d)\
1336
0
CHECK_BIDIR(-(a),-(b),-(c),-(d))
1337
1338
0
        do{
1339
0
            int i;
1340
0
            int borderdist=0;
1341
0
            end=1;
1342
1343
0
            CHECK_BIDIR2(0,0,0,1)
1344
0
            CHECK_BIDIR2(0,0,1,0)
1345
0
            CHECK_BIDIR2(0,1,0,0)
1346
0
            CHECK_BIDIR2(1,0,0,0)
1347
1348
0
            for(i=8; i<limit; i++){
1349
0
                int fx= motion_fx+vect[i][0];
1350
0
                int fy= motion_fy+vect[i][1];
1351
0
                int bx= motion_bx+vect[i][2];
1352
0
                int by= motion_by+vect[i][3];
1353
0
                if(borderdist<=0){
1354
0
                    int a= (xmax - FFMAX(fx,bx))|(FFMIN(fx,bx) - xmin);
1355
0
                    int b= (ymax - FFMAX(fy,by))|(FFMIN(fy,by) - ymin);
1356
0
                    if((a|b) < 0)
1357
0
                        map[(hashidx+hash[i])&255] = 1;
1358
0
                }
1359
0
                if(!map[(hashidx+hash[i])&255]){
1360
0
                    int score;
1361
0
                    map[(hashidx+hash[i])&255] = 1;
1362
0
                    score= check_bidir_mv(s, fx, fy, bx, by, pred_fx, pred_fy, pred_bx, pred_by, 0, 16);
1363
0
                    if(score < fbmin){
1364
0
                        hashidx += hash[i];
1365
0
                        fbmin= score;
1366
0
                        motion_fx=fx;
1367
0
                        motion_fy=fy;
1368
0
                        motion_bx=bx;
1369
0
                        motion_by=by;
1370
0
                        end=0;
1371
0
                        borderdist--;
1372
0
                        if(borderdist<=0){
1373
0
                            int a= FFMIN(xmax - FFMAX(fx,bx), FFMIN(fx,bx) - xmin);
1374
0
                            int b= FFMIN(ymax - FFMAX(fy,by), FFMIN(fy,by) - ymin);
1375
0
                            borderdist= FFMIN(a,b);
1376
0
                        }
1377
0
                    }
1378
0
                }
1379
0
            }
1380
0
        }while(!end);
1381
0
    }
1382
1383
0
    s->b_bidir_forw_mv_table[xy][0]= motion_fx;
1384
0
    s->b_bidir_forw_mv_table[xy][1]= motion_fy;
1385
0
    s->b_bidir_back_mv_table[xy][0]= motion_bx;
1386
0
    s->b_bidir_back_mv_table[xy][1]= motion_by;
1387
1388
0
    return fbmin;
1389
0
}
1390
1391
static inline int direct_search(MPVEncContext *const s, int mb_x, int mb_y)
1392
0
{
1393
0
    MotionEstContext *const c = &s->me;
1394
0
    int P[10][2];
1395
0
    const int mot_stride = s->c.mb_stride;
1396
0
    const int mot_xy = mb_y*mot_stride + mb_x;
1397
0
    const int shift= 1+s->c.quarter_sample;
1398
0
    int dmin, i;
1399
0
    const int time_pp= s->c.pp_time;
1400
0
    const int time_pb= s->c.pb_time;
1401
0
    int mx, my, xmin, xmax, ymin, ymax;
1402
0
    int16_t (*mv_table)[2]= s->b_direct_mv_table;
1403
1404
0
    c->current_mv_penalty= c->mv_penalty[1] + MAX_DMV;
1405
0
    ymin= xmin=(-32)>>shift;
1406
0
    ymax= xmax=   31>>shift;
1407
1408
0
    if (IS_8X8(s->c.next_pic.mb_type[mot_xy])) {
1409
0
        s->c.mv_type = MV_TYPE_8X8;
1410
0
    }else{
1411
0
        s->c.mv_type = MV_TYPE_16X16;
1412
0
    }
1413
1414
0
    for(i=0; i<4; i++){
1415
0
        int index= s->c.block_index[i];
1416
0
        int min, max;
1417
1418
0
        c->co_located_mv[i][0] = s->c.next_pic.motion_val[0][index][0];
1419
0
        c->co_located_mv[i][1] = s->c.next_pic.motion_val[0][index][1];
1420
0
        c->direct_basis_mv[i][0]= c->co_located_mv[i][0]*time_pb/time_pp + ((i& 1)<<(shift+3));
1421
0
        c->direct_basis_mv[i][1]= c->co_located_mv[i][1]*time_pb/time_pp + ((i>>1)<<(shift+3));
1422
//        c->direct_basis_mv[1][i][0]= c->co_located_mv[i][0]*(time_pb - time_pp)/time_pp + ((i &1)<<(shift+3);
1423
//        c->direct_basis_mv[1][i][1]= c->co_located_mv[i][1]*(time_pb - time_pp)/time_pp + ((i>>1)<<(shift+3);
1424
1425
0
        max= FFMAX(c->direct_basis_mv[i][0], c->direct_basis_mv[i][0] - c->co_located_mv[i][0])>>shift;
1426
0
        min= FFMIN(c->direct_basis_mv[i][0], c->direct_basis_mv[i][0] - c->co_located_mv[i][0])>>shift;
1427
0
        max+= 16*mb_x + 1; // +-1 is for the simpler rounding
1428
0
        min+= 16*mb_x - 1;
1429
0
        xmax= FFMIN(xmax, s->c.width - max);
1430
0
        xmin= FFMAX(xmin, - 16     - min);
1431
1432
0
        max= FFMAX(c->direct_basis_mv[i][1], c->direct_basis_mv[i][1] - c->co_located_mv[i][1])>>shift;
1433
0
        min= FFMIN(c->direct_basis_mv[i][1], c->direct_basis_mv[i][1] - c->co_located_mv[i][1])>>shift;
1434
0
        max+= 16*mb_y + 1; // +-1 is for the simpler rounding
1435
0
        min+= 16*mb_y - 1;
1436
0
        ymax= FFMIN(ymax, s->c.height - max);
1437
0
        ymin= FFMAX(ymin, - 16      - min);
1438
1439
0
        if(s->c.mv_type == MV_TYPE_16X16) break;
1440
0
    }
1441
1442
0
    av_assert2(xmax <= 15 && ymax <= 15 && xmin >= -16 && ymin >= -16);
1443
1444
0
    if(xmax < 0 || xmin >0 || ymax < 0 || ymin > 0){
1445
0
        s->b_direct_mv_table[mot_xy][0]= 0;
1446
0
        s->b_direct_mv_table[mot_xy][1]= 0;
1447
1448
0
        return 256*256*256*64-1;
1449
0
    }
1450
1451
0
    c->xmin= xmin;
1452
0
    c->ymin= ymin;
1453
0
    c->xmax= xmax;
1454
0
    c->ymax= ymax;
1455
0
    c->flags     |= FLAG_DIRECT;
1456
0
    c->sub_flags |= FLAG_DIRECT;
1457
0
    c->pred_x=0;
1458
0
    c->pred_y=0;
1459
1460
0
    P_LEFT[0] = av_clip(mv_table[mot_xy - 1][0], xmin * (1 << shift), xmax << shift);
1461
0
    P_LEFT[1] = av_clip(mv_table[mot_xy - 1][1], ymin * (1 << shift), ymax << shift);
1462
1463
    /* special case for first line */
1464
0
    if (!s->c.first_slice_line) { //FIXME maybe allow this over thread boundary as it is clipped
1465
0
        P_TOP[0]      = av_clip(mv_table[mot_xy - mot_stride    ][0], xmin * (1 << shift), xmax << shift);
1466
0
        P_TOP[1]      = av_clip(mv_table[mot_xy - mot_stride    ][1], ymin * (1 << shift), ymax << shift);
1467
0
        P_TOPRIGHT[0] = av_clip(mv_table[mot_xy - mot_stride + 1][0], xmin * (1 << shift), xmax << shift);
1468
0
        P_TOPRIGHT[1] = av_clip(mv_table[mot_xy - mot_stride + 1][1], ymin * (1 << shift), ymax << shift);
1469
1470
0
        P_MEDIAN[0]= mid_pred(P_LEFT[0], P_TOP[0], P_TOPRIGHT[0]);
1471
0
        P_MEDIAN[1]= mid_pred(P_LEFT[1], P_TOP[1], P_TOPRIGHT[1]);
1472
0
    }
1473
1474
0
    dmin = ff_epzs_motion_search(s, &mx, &my, P, 0, 0, mv_table, 1<<(16-shift), 0, 16);
1475
0
    if(c->sub_flags&FLAG_QPEL)
1476
0
        dmin = qpel_motion_search(s, &mx, &my, dmin, 0, 0, 0, 16);
1477
0
    else
1478
0
        dmin = hpel_motion_search(s, &mx, &my, dmin, 0, 0, 0, 16);
1479
1480
0
    if(c->avctx->me_sub_cmp != c->avctx->mb_cmp && !c->skip)
1481
0
        dmin= get_mb_score(s, mx, my, 0, 0, 0, 16, 1);
1482
1483
0
    get_limits(s, 16*mb_x, 16*mb_y, 1); //restore c->?min/max, maybe not needed
1484
1485
0
    mv_table[mot_xy][0]= mx;
1486
0
    mv_table[mot_xy][1]= my;
1487
0
    c->flags     &= ~FLAG_DIRECT;
1488
0
    c->sub_flags &= ~FLAG_DIRECT;
1489
1490
0
    return dmin;
1491
0
}
1492
1493
void ff_estimate_b_frame_motion(MPVEncContext *const s,
1494
                             int mb_x, int mb_y)
1495
0
{
1496
0
    MotionEstContext *const c = &s->me;
1497
0
    int fmin, bmin, dmin, fbmin, bimin, fimin;
1498
0
    int type=0;
1499
0
    const int xy = mb_y*s->c.mb_stride + mb_x;
1500
0
    init_ref(c, s->new_pic->data, s->c.last_pic.data,
1501
0
             s->c.next_pic.data, 16 * mb_x, 16 * mb_y, 2);
1502
1503
0
    get_limits(s, 16*mb_x, 16*mb_y, 1);
1504
1505
0
    c->skip=0;
1506
1507
0
    if (s->c.codec_id == AV_CODEC_ID_MPEG4 && s->c.next_pic.mbskip_table[xy]) {
1508
0
        int score= direct_search(s, mb_x, mb_y); //FIXME just check 0,0
1509
1510
0
        score= ((unsigned)(score*score + 128*256))>>16;
1511
0
        c->mc_mb_var_sum_temp += score;
1512
0
        s->mc_mb_var[mb_y*s->c.mb_stride + mb_x] = score; //FIXME use SSE
1513
0
        s->mb_type[mb_y*s->c.mb_stride + mb_x]= CANDIDATE_MB_TYPE_DIRECT0;
1514
1515
0
        return;
1516
0
    }
1517
1518
0
    c->penalty_factor    = get_penalty_factor(s->lambda, s->lambda2, c->avctx->me_cmp);
1519
0
    c->sub_penalty_factor= get_penalty_factor(s->lambda, s->lambda2, c->avctx->me_sub_cmp);
1520
0
    c->mb_penalty_factor = get_penalty_factor(s->lambda, s->lambda2, c->avctx->mb_cmp);
1521
1522
0
    if (s->c.codec_id == AV_CODEC_ID_MPEG4)
1523
0
        dmin= direct_search(s, mb_x, mb_y);
1524
0
    else
1525
0
        dmin= INT_MAX;
1526
1527
// FIXME penalty stuff for non-MPEG-4
1528
0
    c->skip=0;
1529
0
    fmin = estimate_motion_b(s, mb_x, mb_y, s->b_forw_mv_table, 0, s->f_code) +
1530
0
           3 * c->mb_penalty_factor;
1531
1532
0
    c->skip=0;
1533
0
    bmin = estimate_motion_b(s, mb_x, mb_y, s->b_back_mv_table, 2, s->b_code) +
1534
0
           2 * c->mb_penalty_factor;
1535
0
    ff_dlog(c->avctx, " %d %d ", s->b_forw_mv_table[xy][0], s->b_forw_mv_table[xy][1]);
1536
1537
0
    c->skip=0;
1538
0
    fbmin= bidir_refine(s, mb_x, mb_y) + c->mb_penalty_factor;
1539
0
    ff_dlog(c->avctx, "%d %d %d %d\n", dmin, fmin, bmin, fbmin);
1540
1541
0
    if (c->avctx->flags & AV_CODEC_FLAG_INTERLACED_ME) {
1542
//FIXME mb type penalty
1543
0
        c->skip=0;
1544
0
        c->current_mv_penalty = c->mv_penalty[s->f_code] + MAX_DMV;
1545
0
        fimin= interlaced_search(s, 0,
1546
0
                                 s->b_field_mv_table[0], s->b_field_select_table[0],
1547
0
                                 s->b_forw_mv_table[xy][0], s->b_forw_mv_table[xy][1], 0);
1548
0
        c->current_mv_penalty = c->mv_penalty[s->b_code] + MAX_DMV;
1549
0
        bimin= interlaced_search(s, 2,
1550
0
                                 s->b_field_mv_table[1], s->b_field_select_table[1],
1551
0
                                 s->b_back_mv_table[xy][0], s->b_back_mv_table[xy][1], 0);
1552
0
    }else
1553
0
        fimin= bimin= INT_MAX;
1554
1555
0
    {
1556
0
        int score= fmin;
1557
0
        type = CANDIDATE_MB_TYPE_FORWARD;
1558
1559
0
        if (dmin <= score){
1560
0
            score = dmin;
1561
0
            type = CANDIDATE_MB_TYPE_DIRECT;
1562
0
        }
1563
0
        if(bmin<score){
1564
0
            score=bmin;
1565
0
            type= CANDIDATE_MB_TYPE_BACKWARD;
1566
0
        }
1567
0
        if(fbmin<score){
1568
0
            score=fbmin;
1569
0
            type= CANDIDATE_MB_TYPE_BIDIR;
1570
0
        }
1571
0
        if(fimin<score){
1572
0
            score=fimin;
1573
0
            type= CANDIDATE_MB_TYPE_FORWARD_I;
1574
0
        }
1575
0
        if(bimin<score){
1576
0
            score=bimin;
1577
0
            type= CANDIDATE_MB_TYPE_BACKWARD_I;
1578
0
        }
1579
1580
0
        score= ((unsigned)(score*score + 128*256))>>16;
1581
0
        c->mc_mb_var_sum_temp += score;
1582
0
        s->mc_mb_var[mb_y*s->c.mb_stride + mb_x] = score; //FIXME use SSE
1583
0
    }
1584
1585
0
    if(c->avctx->mb_decision > FF_MB_DECISION_SIMPLE){
1586
0
        type= CANDIDATE_MB_TYPE_FORWARD | CANDIDATE_MB_TYPE_BACKWARD | CANDIDATE_MB_TYPE_BIDIR | CANDIDATE_MB_TYPE_DIRECT;
1587
0
        if(fimin < INT_MAX)
1588
0
            type |= CANDIDATE_MB_TYPE_FORWARD_I;
1589
0
        if(bimin < INT_MAX)
1590
0
            type |= CANDIDATE_MB_TYPE_BACKWARD_I;
1591
0
        if(fimin < INT_MAX && bimin < INT_MAX){
1592
0
            type |= CANDIDATE_MB_TYPE_BIDIR_I;
1593
0
        }
1594
         //FIXME something smarter
1595
0
        if(dmin>256*256*16) type&= ~CANDIDATE_MB_TYPE_DIRECT; //do not try direct mode if it is invalid for this MB
1596
0
        if (s->c.codec_id == AV_CODEC_ID_MPEG4 && type&CANDIDATE_MB_TYPE_DIRECT &&
1597
0
            s->mpv_flags & FF_MPV_FLAG_MV0 && *(uint32_t*)s->b_direct_mv_table[xy])
1598
0
            type |= CANDIDATE_MB_TYPE_DIRECT0;
1599
0
    }
1600
1601
0
    s->mb_type[mb_y*s->c.mb_stride + mb_x]= type;
1602
0
}
1603
1604
/* find best f_code for ME which do unlimited searches */
1605
int ff_get_best_fcode(MPVMainEncContext *const m, const int16_t (*mv_table)[2], int type)
1606
0
{
1607
0
    MPVEncContext *const s = &m->s;
1608
0
    MotionEstContext *const c = &s->me;
1609
1610
0
    if (c->motion_est != FF_ME_ZERO) {
1611
0
        int score[8];
1612
0
        int i, range = c->avctx->me_range ? c->avctx->me_range : (INT_MAX/2);
1613
0
        const uint8_t * fcode_tab = m->fcode_tab;
1614
0
        int best_fcode=-1;
1615
0
        int best_score=-10000000;
1616
1617
0
        if (s->c.msmpeg4_version != MSMP4_UNUSED)
1618
0
            range= FFMIN(range, 16);
1619
0
        else if (s->c.codec_id == AV_CODEC_ID_MPEG2VIDEO &&
1620
0
                 c->avctx->strict_std_compliance >= FF_COMPLIANCE_NORMAL)
1621
0
            range= FFMIN(range, 256);
1622
1623
0
        for(i=0; i<8; i++) score[i]= s->c.mb_num*(8-i);
1624
1625
0
        for (int y = 0; y < s->c.mb_height; y++) {
1626
0
            int x;
1627
0
            int xy= y*s->c.mb_stride;
1628
0
            for(x=0; x<s->c.mb_width; x++, xy++){
1629
0
                if(s->mb_type[xy] & type){
1630
0
                    int mx= mv_table[xy][0];
1631
0
                    int my= mv_table[xy][1];
1632
0
                    int fcode = FFMAX(fcode_tab[mx], fcode_tab[my]);
1633
0
                    int j;
1634
1635
0
                    if (mx >= range || mx < -range ||
1636
0
                        my >= range || my < -range)
1637
0
                        continue;
1638
1639
0
                    for(j=0; j<fcode && j<8; j++){
1640
0
                        if (s->c.pict_type == AV_PICTURE_TYPE_B ||
1641
0
                            s->mc_mb_var[xy] < s->mb_var[xy])
1642
0
                            score[j]-= 170;
1643
0
                    }
1644
0
                }
1645
0
            }
1646
0
        }
1647
1648
0
        for(i=1; i<8; i++){
1649
0
            if(score[i] > best_score){
1650
0
                best_score= score[i];
1651
0
                best_fcode= i;
1652
0
            }
1653
0
        }
1654
1655
0
        return best_fcode;
1656
0
    }else{
1657
0
        return 1;
1658
0
    }
1659
0
}
1660
1661
void ff_fix_long_p_mvs(MPVEncContext *const s, int type)
1662
55.9k
{
1663
55.9k
    MotionEstContext *const c = &s->me;
1664
55.9k
    const int f_code= s->f_code;
1665
55.9k
    int y, range;
1666
55.9k
    av_assert0(s->c.pict_type == AV_PICTURE_TYPE_P);
1667
1668
55.9k
    range = (((s->c.out_format == FMT_MPEG1 || s->c.msmpeg4_version != MSMP4_UNUSED) ? 8 : 16) << f_code);
1669
1670
55.9k
    av_assert0(range <= 16 || s->c.msmpeg4_version == MSMP4_UNUSED);
1671
55.9k
    av_assert0(range <=256 || !(s->c.codec_id == AV_CODEC_ID_MPEG2VIDEO && c->avctx->strict_std_compliance >= FF_COMPLIANCE_NORMAL));
1672
1673
55.9k
    if(c->avctx->me_range && range > c->avctx->me_range) range= c->avctx->me_range;
1674
1675
55.9k
    if (c->avctx->flags & AV_CODEC_FLAG_4MV) {
1676
0
        const int wrap= s->c.b8_stride;
1677
1678
        /* clip / convert to intra 8x8 type MVs */
1679
0
        for(y=0; y<s->c.mb_height; y++){
1680
0
            int xy= y*2*wrap;
1681
0
            int i= y*s->c.mb_stride;
1682
0
            int x;
1683
1684
0
            for(x=0; x<s->c.mb_width; x++){
1685
0
                if(s->mb_type[i]&CANDIDATE_MB_TYPE_INTER4V){
1686
0
                    int block;
1687
0
                    for(block=0; block<4; block++){
1688
0
                        int off= (block& 1) + (block>>1)*wrap;
1689
0
                        int mx = s->c.cur_pic.motion_val[0][ xy + off ][0];
1690
0
                        int my = s->c.cur_pic.motion_val[0][ xy + off ][1];
1691
1692
0
                        if(   mx >=range || mx <-range
1693
0
                           || my >=range || my <-range){
1694
0
                            s->mb_type[i] &= ~CANDIDATE_MB_TYPE_INTER4V;
1695
0
                            s->mb_type[i] |= type;
1696
0
                            s->c.cur_pic.mb_type[i] = type;
1697
0
                        }
1698
0
                    }
1699
0
                }
1700
0
                xy+=2;
1701
0
                i++;
1702
0
            }
1703
0
        }
1704
0
    }
1705
55.9k
}
1706
1707
/**
1708
 * @param truncate 1 for truncation, 0 for using intra
1709
 */
1710
void ff_fix_long_mvs(MPVEncContext *const s, uint8_t *field_select_table, int field_select,
1711
                     int16_t (*mv_table)[2], int f_code, int type, int truncate)
1712
55.9k
{
1713
55.9k
    MotionEstContext *const c = &s->me;
1714
55.9k
    int y, h_range, v_range;
1715
1716
    // RAL: 8 in MPEG-1, 16 in MPEG-4
1717
55.9k
    int range = (((s->c.out_format == FMT_MPEG1 || s->c.msmpeg4_version != MSMP4_UNUSED) ? 8 : 16) << f_code);
1718
1719
55.9k
    if(c->avctx->me_range && range > c->avctx->me_range) range= c->avctx->me_range;
1720
1721
55.9k
    h_range= range;
1722
55.9k
    v_range= field_select_table ? range>>1 : range;
1723
1724
    /* clip / convert to intra 16x16 type MVs */
1725
162k
    for(y=0; y<s->c.mb_height; y++){
1726
106k
        int x;
1727
106k
        int xy= y*s->c.mb_stride;
1728
488k
        for(x=0; x<s->c.mb_width; x++){
1729
381k
            if (s->mb_type[xy] & type){    // RAL: "type" test added...
1730
196k
                if (!field_select_table || field_select_table[xy] == field_select) {
1731
196k
                    if(   mv_table[xy][0] >=h_range || mv_table[xy][0] <-h_range
1732
181k
                       || mv_table[xy][1] >=v_range || mv_table[xy][1] <-v_range){
1733
1734
28.1k
                        if(truncate){
1735
0
                            if     (mv_table[xy][0] > h_range-1) mv_table[xy][0]=  h_range-1;
1736
0
                            else if(mv_table[xy][0] < -h_range ) mv_table[xy][0]= -h_range;
1737
0
                            if     (mv_table[xy][1] > v_range-1) mv_table[xy][1]=  v_range-1;
1738
0
                            else if(mv_table[xy][1] < -v_range ) mv_table[xy][1]= -v_range;
1739
28.1k
                        }else{
1740
28.1k
                            s->mb_type[xy] &= ~type;
1741
28.1k
                            s->mb_type[xy] |= CANDIDATE_MB_TYPE_INTRA;
1742
28.1k
                            mv_table[xy][0]=
1743
28.1k
                            mv_table[xy][1]= 0;
1744
28.1k
                        }
1745
28.1k
                    }
1746
196k
                }
1747
196k
            }
1748
381k
            xy++;
1749
381k
        }
1750
106k
    }
1751
55.9k
}