/*****************************************************************************
 * common.h: misc common functions
 *****************************************************************************
 * Copyright (C) 2003-2014 x264 project
 *
 * Authors: Laurent Aimar <fenrir@via.ecp.fr>
 *          Loren Merritt <lorenm@u.washington.edu>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation; either version 2 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02111, USA.
 *
 * This program is also available under a commercial proprietary license.
 * For more information, contact us at licensing@x264.com.
 *****************************************************************************/

27
28
#ifndef X264_COMMON_H
#define X264_COMMON_H
Laurent Aimar's avatar
Laurent Aimar committed
29

Loren Merritt's avatar
Loren Merritt committed
30
31
32
33
34
35
36
37
38
/****************************************************************************
 * Macros
 ****************************************************************************/
/* Smallest / largest of two, three or four values.
 * These are plain textual macros: every argument may be expanded (and hence
 * evaluated) more than once, so do not pass expressions with side effects.
 * The 3- and 4-argument forms simply nest the 2-argument form, which already
 * parenthesizes each of its operands. */
#define X264_MIN(a,b)      ( (a)<(b) ? (a) : (b) )
#define X264_MAX(a,b)      ( (a)>(b) ? (a) : (b) )
#define X264_MIN3(a,b,c)   X264_MIN( a, X264_MIN( b, c ) )
#define X264_MAX3(a,b,c)   X264_MAX( a, X264_MAX( b, c ) )
#define X264_MIN4(a,b,c,d) X264_MIN( a, X264_MIN3( b, c, d ) )
#define X264_MAX4(a,b,c,d) X264_MAX( a, X264_MAX3( b, c, d ) )
39
/* Swap two lvalues a and b of the given type.
 * The temporary has a macro-private name so that swapping a caller variable
 * that happens to be called `t` is not silently captured by the macro, and
 * the operands are parenthesized. a and b are each expanded twice. */
#define XCHG(type,a,b) do{ type xchg_tmp_ = (a); (a) = (b); (b) = xchg_tmp_; } while(0)
Lamont Alston's avatar
Lamont Alston committed
40
/* Non-zero when the given frame type equals X264_TYPE_B.
 * The argument is parenthesized so that expressions using operators with
 * lower precedence than == (|, &, ?:) compare as a whole. */
#define IS_DISPOSABLE(type) ( (type) == X264_TYPE_B )
Loren Merritt's avatar
Loren Merritt committed
41
/* Convert f to an integer scaled by 1<<8, adding .5 before the truncating
 * cast to int. The argument is parenthesized so that compound expressions
 * such as FIX8(a+b) are scaled as a whole. */
#define FIX8(f) ((int)((f)*(1<<8)+.5))
42
/* Round x up to a multiple of a by adding a-1 and masking off the low bits.
 * The mask ~(a-1) only yields a multiple of a when a is a power of two.
 * a is expanded twice. */
#define ALIGN(x,a) (((x)+((a)-1))&~((a)-1))
43
/* Element count of a true array (total size divided by the size of one
 * element). Does not work on pointers, including array parameters. */
#define ARRAY_ELEMS(a) ( sizeof(a) / sizeof((a)[0]) )
Loren Merritt's avatar
Loren Merritt committed
44

45
/* Allocate `size` bytes into `var` with x264_malloc(). On failure, jump to a
 * label named `fail`, which the function using this macro must provide. */
#define CHECKED_MALLOC( var, size )\
do {\
    var = x264_malloc( size );\
    if( !var )\
        goto fail;\
} while( 0 )

/* Same as CHECKED_MALLOC, then zero-fill the new buffer.
 * `size` is evaluated exactly once into a macro-private local, so the
 * allocation and the memset always agree on the length even if the size
 * expression has side effects. */
#define CHECKED_MALLOCZERO( var, size )\
do {\
    size_t checked_malloc_size_ = (size);\
    CHECKED_MALLOC( var, checked_malloc_size_ );\
    memset( var, 0, checked_malloc_size_ );\
} while( 0 )
56

Henrik Gramner's avatar
Henrik Gramner committed
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
/* Macros for merging multiple allocations into a single large malloc, for improved
 * use with huge pages.
 *
 * Usage pattern visible from the macros below: PREALLOC_INIT once, then one
 * PREALLOC per buffer, then a single PREALLOC_END that performs the real
 * allocation and fixes up every registered pointer. */

/* Needs to be enough to contain any set of buffers that use combined allocations */
/* NOTE: PREALLOC does not check prealloc_idx against this limit. */
#define PREALLOC_BUF_SIZE 1024

/* Expands to three local declarations: the number of registered buffers,
 * the running total size in bytes, and the table of addresses of the
 * pointer variables to patch. */
#define PREALLOC_INIT\
    int    prealloc_idx = 0;\
    size_t prealloc_size = 0;\
    uint8_t **preallocs[PREALLOC_BUF_SIZE];

/* Register one buffer: temporarily store the buffer's byte offset inside the
 * future combined allocation in `var` (disguised as a pointer), remember the
 * address of `var`, and grow the total by `size` rounded up to NATIVE_ALIGN. */
#define PREALLOC( var, size )\
do {\
    var = (void*)prealloc_size;\
    preallocs[prealloc_idx++] = (uint8_t**)&var;\
    prealloc_size += ALIGN(size, NATIVE_ALIGN);\
} while(0)

/* Allocate the combined buffer into `ptr` (CHECKED_MALLOC jumps to `fail` on
 * failure), then add the base address to every registered variable, turning
 * the stored offsets into real pointers. Leaves prealloc_idx at -1. */
#define PREALLOC_END( ptr )\
do {\
    CHECKED_MALLOC( ptr, prealloc_size );\
    while( prealloc_idx-- )\
        *preallocs[prealloc_idx] += (intptr_t)ptr;\
} while(0)

Steve Borho's avatar
Steve Borho committed
82
83
/* Number of elements in a true array; not valid for pointers. */
#define ARRAY_SIZE(array)  ( sizeof(array) / sizeof((array)[0]) )

84
/* Fixed upper limits; several of them size static arrays further down in
 * this header (e.g. X264_REF_MAX, X264_THREAD_MAX, X264_LOOKAHEAD_THREAD_MAX). */
#define X264_BFRAME_MAX 16
#define X264_REF_MAX 16
#define X264_THREAD_MAX 128
#define X264_LOOKAHEAD_THREAD_MAX 16
#define X264_PCM_COST (FRAME_SIZE(256*BIT_DEPTH)+16)
#define X264_LOOKAHEAD_MAX 250
/* QP range. QP_BD_OFFSET grows by 6 per bit of depth above 8;
 * QP_MAX_MAX equals QP_MAX evaluated with BIT_DEPTH == 10. */
#define QP_BD_OFFSET (6*(BIT_DEPTH-8))
#define QP_MAX_SPEC (51+QP_BD_OFFSET)
#define QP_MAX (QP_MAX_SPEC+18)
#define QP_MAX_MAX (51+2*6+18)
#define PIXEL_MAX ((1 << BIT_DEPTH)-1)
// arbitrary, but low because SATD scores are 1/4 normal
#define X264_LOOKAHEAD_QP (12+QP_BD_OFFSET)
/* Clamp a QP to QP_MAX_SPEC (x may be evaluated twice via X264_MIN). */
#define SPEC_QP(x) X264_MIN((x), QP_MAX_SPEC)

// number of pixels (per thread) in progress at any given time.
// 16 for the macroblock in progress + 3 for deblocking + 3 for motion compensation filter + 2 for extra safety
#define X264_THREAD_HEIGHT 24
102

Dylan Yudaken's avatar
Dylan Yudaken committed
103
104
105
106
107
108
109
/* WEIGHTP_FAKE is set when mb_tree & psy are enabled, but normal weightp is disabled
 * (such as in baseline). It checks for fades in lookahead and adjusts qp accordingly
 * to increase quality. Defined as (-1) so that if(i_weighted_pred > 0) is true only when
 * real weights are being used. */

#define X264_WEIGHTP_FAKE (-1)

#define NALU_OVERHEAD 5 // startcode + NAL type costs 5 bytes per frame
#define FILLER_OVERHEAD (NALU_OVERHEAD+1)
/* Needs a variable named `h` in scope at the point of use. One byte less than
 * NALU_OVERHEAD when b_annexb is set, i_avcintra_class is zero and
 * h->out.i_nal is not 1. */
#define SEI_OVERHEAD (NALU_OVERHEAD - (h->param.b_annexb && !h->param.i_avcintra_class && (h->out.i_nal-1)))
113

Loren Merritt's avatar
Loren Merritt committed
114
115
116
/****************************************************************************
 * Includes
 ****************************************************************************/
117
#include "osdep.h"
118
#include <stdarg.h>
119
#include <stddef.h>
120
121
122
#include <stdlib.h>
#include <string.h>
#include <assert.h>
Fiona Glaser's avatar
Fiona Glaser committed
123
#include <limits.h>
Fiona Glaser's avatar
Fiona Glaser committed
124

125
126
127
128
129
130
131
132
133
134
/* Interlacing queries. When HAVE_INTERLACED is non-zero they read the
 * corresponding fields through a variable named `h` that must be in scope at
 * the point of use; otherwise all three are the constant 0. */
#if HAVE_INTERLACED
#   define MB_INTERLACED h->mb.b_interlaced
#   define SLICE_MBAFF h->sh.b_mbaff
#   define PARAM_INTERLACED h->param.b_interlaced
#else
#   define MB_INTERLACED 0
#   define SLICE_MBAFF 0
#   define PARAM_INTERLACED 0
#endif

135
136
137
138
139
140
141
142
143
144
145
/* Chroma subsampling helpers. If CHROMA_FORMAT is already defined when this
 * header is read, the shifts are derived from it as constant expressions;
 * otherwise the format and both shifts are read through a variable named `h`
 * that must be in scope at the point of use. */
#ifdef CHROMA_FORMAT
#    define CHROMA_H_SHIFT (CHROMA_FORMAT == CHROMA_420 || CHROMA_FORMAT == CHROMA_422)
#    define CHROMA_V_SHIFT (CHROMA_FORMAT == CHROMA_420)
#else
#    define CHROMA_FORMAT h->sps->i_chroma_format_idc
#    define CHROMA_H_SHIFT h->mb.chroma_h_shift
#    define CHROMA_V_SHIFT h->mb.chroma_v_shift
#endif

/* CHROMA_SIZE: s shifted right by the sum of both chroma shifts.
 * FRAME_SIZE: s plus two such chroma-sized parts. */
#define CHROMA_SIZE(s) ((s)>>(CHROMA_H_SHIFT+CHROMA_V_SHIFT))
#define FRAME_SIZE(s) ((s)+2*CHROMA_SIZE(s))
Henrik Gramner's avatar
Henrik Gramner committed
146
/* Non-zero when CHROMA_FORMAT equals CHROMA_444. */
#define CHROMA444 (CHROMA_FORMAT == CHROMA_444)
Fiona Glaser's avatar
Fiona Glaser committed
147

148
/* Unions for type-punning.
Fiona Glaser's avatar
Fiona Glaser committed
149
150
151
 * Mn: load or store n bits, aligned, native-endian
 * CPn: copy n bits, aligned, native-endian
 * we don't use memcpy for CPn because memcpy's args aren't assumed to be aligned */
152
153
154
typedef union { uint16_t i; uint8_t  c[2]; } MAY_ALIAS x264_union16_t;
typedef union { uint32_t i; uint16_t b[2]; uint8_t  c[4]; } MAY_ALIAS x264_union32_t;
typedef union { uint64_t i; uint32_t a[2]; uint16_t b[4]; uint8_t c[8]; } MAY_ALIAS x264_union64_t;
Fiona Glaser's avatar
Fiona Glaser committed
155
156
typedef struct { uint64_t i[2]; } x264_uint128_t;
typedef union { x264_uint128_t i; uint64_t a[2]; uint32_t b[4]; uint16_t c[8]; uint8_t d[16]; } MAY_ALIAS x264_union128_t;
Fiona Glaser's avatar
Fiona Glaser committed
157
158
159
#define M16(src) (((x264_union16_t*)(src))->i)
#define M32(src) (((x264_union32_t*)(src))->i)
#define M64(src) (((x264_union64_t*)(src))->i)
Fiona Glaser's avatar
Fiona Glaser committed
160
161
#define M128(src) (((x264_union128_t*)(src))->i)
#define M128_ZERO ((x264_uint128_t){{0,0}})
Fiona Glaser's avatar
Fiona Glaser committed
162
163
164
#define CP16(dst,src) M16(dst) = M16(src)
#define CP32(dst,src) M32(dst) = M32(src)
#define CP64(dst,src) M64(dst) = M64(src)
Fiona Glaser's avatar
Fiona Glaser committed
165
#define CP128(dst,src) M128(dst) = M128(src)
Fiona Glaser's avatar
Fiona Glaser committed
166

167
/* Sample and coefficient types. With HIGH_BIT_DEPTH the sample type is 16 bits
 * wide and coefficients are 32 bits; otherwise 8 and 16 bits respectively.
 * pixel4 holds four packed samples; PIXEL_SPLAT_X4 replicates one sample
 * value into all four lanes and MPIXEL_X4 accesses four samples at once. */
#if HIGH_BIT_DEPTH
    typedef uint16_t pixel;
    typedef uint64_t pixel4;
    typedef int32_t  dctcoef;
    typedef uint32_t udctcoef;

#   define PIXEL_SPLAT_X4(x) ((x)*0x0001000100010001ULL)
#   define MPIXEL_X4(src) M64(src)
#else
    typedef uint8_t  pixel;
    typedef uint32_t pixel4;
    typedef int16_t  dctcoef;
    typedef uint16_t udctcoef;

#   define PIXEL_SPLAT_X4(x) ((x)*0x01010101U)
#   define MPIXEL_X4(src) M32(src)
#endif

185
186
#define BIT_DEPTH X264_BIT_DEPTH

/* Copy four packed samples from src to dst. */
#define CPPIXEL_X4(dst,src) MPIXEL_X4(dst) = MPIXEL_X4(src)

/* scan8 cache geometry: 5 rows of 8 entries per plane, three planes;
 * X264_SCAN8_0 is the offset of column 4, row 1. */
#define X264_SCAN8_LUMA_SIZE (5*8)
#define X264_SCAN8_SIZE (X264_SCAN8_LUMA_SIZE*3)
#define X264_SCAN8_0 (4+1*8)

Fiona Glaser's avatar
Fiona Glaser committed
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
/* Scan8 organization:
 *    0 1 2 3 4 5 6 7
 * 0  DY    y y y y y
 * 1        y Y Y Y Y
 * 2        y Y Y Y Y
 * 3        y Y Y Y Y
 * 4        y Y Y Y Y
 * 5  DU    u u u u u
 * 6        u U U U U
 * 7        u U U U U
 * 8        u U U U U
 * 9        u U U U U
 * 10 DV    v v v v v
 * 11       v V V V V
 * 12       v V V V V
 * 13       v V V V V
 * 14       v V V V V
 * DY/DU/DV are for luma/chroma DC.
 */

/* Indices into x264_scan8 for the DC entries: x264_scan8[LUMA_DC] is the DY
 * cell and x264_scan8[CHROMA_DC] / x264_scan8[CHROMA_DC+1] are the DU / DV
 * cells of the layout pictured above. */
#define LUMA_DC   48
#define CHROMA_DC 49

/* Maps a block index to its offset (column + row*8) in the 8-wide scan8 cache.
 * Entries 0-15, 16-31 and 32-47 cover the three planes (rows 1-4, 6-9 and
 * 11-14); the last three entries are the DC cells. */
static const uint8_t x264_scan8[16*3 + 3] =
{
    4+ 1*8, 5+ 1*8, 4+ 2*8, 5+ 2*8,
    6+ 1*8, 7+ 1*8, 6+ 2*8, 7+ 2*8,
    4+ 3*8, 5+ 3*8, 4+ 4*8, 5+ 4*8,
    6+ 3*8, 7+ 3*8, 6+ 4*8, 7+ 4*8,
    4+ 6*8, 5+ 6*8, 4+ 7*8, 5+ 7*8,
    6+ 6*8, 7+ 6*8, 6+ 7*8, 7+ 7*8,
    4+ 8*8, 5+ 8*8, 4+ 9*8, 5+ 9*8,
    6+ 8*8, 7+ 8*8, 6+ 9*8, 7+ 9*8,
    4+11*8, 5+11*8, 4+12*8, 5+12*8,
    6+11*8, 7+11*8, 6+12*8, 7+12*8,
    4+13*8, 5+13*8, 4+14*8, 5+14*8,
    6+13*8, 7+13*8, 6+14*8, 7+14*8,
    0+ 0*8, 0+ 5*8, 0+10*8
};

233
#include "x264.h"
234
235
236
#if HAVE_OPENCL
#include "opencl.h"
#endif
237
#include "cabac.h"
238
#include "bitstream.h"
Laurent Aimar's avatar
Laurent Aimar committed
239
240
241
242
243
244
#include "set.h"
#include "predict.h"
#include "pixel.h"
#include "mc.h"
#include "frame.h"
#include "dct.h"
245
#include "quant.h"
246
#include "cpu.h"
247
#include "threadpool.h"
Laurent Aimar's avatar
Laurent Aimar committed
248

249
/****************************************************************************
 * General functions
 ****************************************************************************/
Laurent Aimar's avatar
Laurent Aimar committed
252
/* x264_malloc : will do or emulate a memalign
Loren Merritt's avatar
Loren Merritt committed
253
 * you have to use x264_free for buffers allocated with x264_malloc */
Laurent Aimar's avatar
Laurent Aimar committed
254
255
256
void *x264_malloc( int );
void  x264_free( void * );

257
258
259
/* x264_slurp_file: malloc space for the whole file and read it */
char *x264_slurp_file( const char *filename );

Laurent Aimar's avatar
Laurent Aimar committed
260
261
262
/* mdate: return the current date in microsecond */
int64_t x264_mdate( void );

263
264
265
266
/* x264_param2string: return a (malloced) string containing most of
 * the encoding options */
char *x264_param2string( x264_param_t *p, int b_res );

267
268
269
/* log */
void x264_log( x264_t *h, int i_level, const char *psz_fmt, ... );

270
void x264_reduce_fraction( uint32_t *n, uint32_t *d );
Fiona Glaser's avatar
Fiona Glaser committed
271
void x264_reduce_fraction64( uint64_t *n, uint64_t *d );
272
void x264_cavlc_init( x264_t *h );
Fiona Glaser's avatar
Fiona Glaser committed
273
void x264_cabac_init( x264_t *h );
Loren Merritt's avatar
Loren Merritt committed
274

275
/* Clamp x to the sample range [0, PIXEL_MAX]. */
static ALWAYS_INLINE pixel x264_clip_pixel( int x )
{
    /* Fast path: no bits set outside the PIXEL_MAX mask means x is already
     * within range. */
    if( !(x & ~PIXEL_MAX) )
        return x;
    /* Out of range: negative values clamp to 0, everything else to PIXEL_MAX.
     * A plain comparison is used instead of (-x)>>31, which overflows for
     * INT_MIN and depends on 32-bit int and arithmetic right shift. */
    return x < 0 ? 0 : PIXEL_MAX;
}

280
/* Clamp v to [i_min, i_max]. The lower bound is tested first, so i_min is
 * returned whenever v < i_min, even if i_min > i_max. */
static ALWAYS_INLINE int x264_clip3( int v, int i_min, int i_max )
{
    return ( (v < i_min) ? i_min : (v > i_max) ? i_max : v );
}

285
/* Floating-point counterpart of x264_clip3: clamp v to [f_min, f_max],
 * testing the lower bound first. */
static ALWAYS_INLINE double x264_clip3f( double v, double f_min, double f_max )
{
    return ( (v < f_min) ? f_min : (v > f_max) ? f_max : v );
}
289

290
/* Branchless median of three ints.
 * Each (d)&((d)>>31) term evaluates to d when d is negative and to 0
 * otherwise. NOTE(review): this relies on int being 32 bits, on >> of a
 * negative value being an arithmetic shift, and on the differences not
 * overflowing. */
static ALWAYS_INLINE int x264_median( int a, int b, int c )
{
    int t = (a-b)&((a-b)>>31);  /* t = min( a-b, 0 ) */
    a -= t;                     /* a = max of the original a, b */
    b += t;                     /* b = min of the original a, b */
    b -= (b-c)&((b-c)>>31);     /* b = max( b, c ) */
    b += (a-b)&((a-b)>>31);     /* b = min( a, b ) -> the median */
    return b;
}

300
/* Component-wise median of three two-element vectors: dst[k] receives the
 * median of a[k], b[k] and c[k] for k = 0, 1. */
static ALWAYS_INLINE void x264_median_mv( int16_t *dst, int16_t *a, int16_t *b, int16_t *c )
{
    dst[0] = x264_median( a[0], b[0], c[0] );
    dst[1] = x264_median( a[1], b[1], c[1] );
}

306
/* Sum, over each pair of consecutive entries in mvc[0..i_mvc-1], of the
 * absolute differences of both components. Returns 0 when i_mvc <= 1. */
static ALWAYS_INLINE int x264_predictor_difference( int16_t (*mvc)[2], intptr_t i_mvc )
{
    int sum = 0;
    for( int i = 0; i < i_mvc-1; i++ )
    {
        sum += abs( mvc[i][0] - mvc[i+1][0] )
             + abs( mvc[i][1] - mvc[i+1][1] );
    }
    return sum;
}

317
/* For each of the two components, add the left and top values and bucket the
 * sum into 0 (sum <= 2), 1 (3..32) or 2 (> 32). The bucket for component 0 is
 * returned in the low byte and the bucket for component 1 in bits 8 and up. */
static ALWAYS_INLINE uint16_t x264_cabac_mvd_sum( uint8_t *mvdleft, uint8_t *mvdtop )
{
    int amvd0 = mvdleft[0] + mvdtop[0];
    int amvd1 = mvdleft[1] + mvdtop[1];
    amvd0 = (amvd0 > 2) + (amvd0 > 32);
    amvd1 = (amvd1 > 2) + (amvd1 > 32);
    return amvd0 + (amvd1<<8);
}

326
327
328
/* Lookup tables defined in another translation unit. In this header,
 * x264_exp2_lut is read by x264_exp2fix8() and the two log2 tables by
 * x264_log2(). */
extern const uint8_t x264_exp2_lut[64];
extern const float x264_log2_lut[128];
extern const float x264_log2_lz_lut[32];
Fiona Glaser's avatar
Fiona Glaser committed
329

Fiona Glaser's avatar
Fiona Glaser committed
330
331
/* Not a general-purpose function; multiplies input by -1/6 to convert
 * qp to qscale. */
Fiona Glaser's avatar
Fiona Glaser committed
332
333
static ALWAYS_INLINE int x264_exp2fix8( float x )
{
Anton Mitrofanov's avatar
Anton Mitrofanov committed
334
335
336
    int i = x*(-64.f/6.f) + 512.5f;
    if( i < 0 ) return 0;
    if( i > 1023 ) return 0xffff;
337
    return (x264_exp2_lut[i&63]+256) << (i>>6) >> 8;
Fiona Glaser's avatar
Fiona Glaser committed
338
339
340
341
342
}

static ALWAYS_INLINE float x264_log2( uint32_t x )
{
    int lz = x264_clz( x );
343
    return x264_log2_lut[(x<<lz>>24)&0x7f] + x264_log2_lz_lut[lz];
Fiona Glaser's avatar
Fiona Glaser committed
344
345
}

346
347
348
/****************************************************************************
 *
 ****************************************************************************/
Laurent Aimar's avatar
Laurent Aimar committed
349
350
351
352
353
354
355
/* Slice types. The numeric values are also used as indices into
 * slice_type_to_char[] below. */
enum slice_type_e
{
    SLICE_TYPE_P  = 0,
    SLICE_TYPE_B  = 1,
    SLICE_TYPE_I  = 2,
};

356
/* One-letter name per slice type, in slice_type_e value order (0=P, 1=B, 2=I). */
static const char slice_type_to_char[] = { 'P', 'B', 'I' };
Loren Merritt's avatar
Loren Merritt committed
357

358
359
360
361
362
363
364
365
366
/* SEI payload type codes. */
enum sei_payload_type_e
{
    SEI_BUFFERING_PERIOD       = 0,
    SEI_PIC_TIMING             = 1,
    SEI_PAN_SCAN_RECT          = 2,
    SEI_FILLER                 = 3,
    SEI_USER_DATA_REGISTERED   = 4,
    SEI_USER_DATA_UNREGISTERED = 5,
    SEI_RECOVERY_POINT         = 6,
    SEI_DEC_REF_PIC_MARKING    = 7,
    SEI_FRAME_PACKING          = 45,
};

Laurent Aimar's avatar
Laurent Aimar committed
371
372
373
374
375
376
377
typedef struct
{
    x264_sps_t *sps;
    x264_pps_t *pps;

    int i_type;
    int i_first_mb;
Loren Merritt's avatar
Loren Merritt committed
378
    int i_last_mb;
Laurent Aimar's avatar
Laurent Aimar committed
379
380
381
382
383

    int i_pps_id;

    int i_frame_num;

384
    int b_mbaff;
Laurent Aimar's avatar
Laurent Aimar committed
385
386
387
388
389
    int b_field_pic;
    int b_bottom_field;

    int i_idr_pic_id;   /* -1 if nal_type != 5 */

390
    int i_poc;
Laurent Aimar's avatar
Laurent Aimar committed
391
392
393
394
395
396
397
398
399
400
401
    int i_delta_poc_bottom;

    int i_delta_poc[2];
    int i_redundant_pic_cnt;

    int b_direct_spatial_mv_pred;

    int b_num_ref_idx_override;
    int i_num_ref_idx_l0_active;
    int i_num_ref_idx_l1_active;

402
    int b_ref_pic_list_reordering[2];
Lamont Alston's avatar
Lamont Alston committed
403
404
    struct
    {
405
406
        int idc;
        int arg;
407
    } ref_pic_list_order[2][X264_REF_MAX];
408

Dylan Yudaken's avatar
Dylan Yudaken committed
409
    /* P-frame weighting */
410
    int b_weighted_pred;
411
    x264_weight_t weight[X264_REF_MAX*2][3];
Dylan Yudaken's avatar
Dylan Yudaken committed
412

Lamont Alston's avatar
Lamont Alston committed
413
414
415
416
417
418
    int i_mmco_remove_from_end;
    int i_mmco_command_count;
    struct /* struct for future expansion */
    {
        int i_difference_of_pic_nums;
        int i_poc;
419
    } mmco[X264_REF_MAX];
Lamont Alston's avatar
Lamont Alston committed
420

Laurent Aimar's avatar
Laurent Aimar committed
421
422
    int i_cabac_init_idc;

423
    int i_qp;
Laurent Aimar's avatar
Laurent Aimar committed
424
425
426
427
428
429
430
431
432
433
434
    int i_qp_delta;
    int b_sp_for_swidth;
    int i_qs_delta;

    /* deblocking filter */
    int i_disable_deblocking_filter_idc;
    int i_alpha_c0_offset;
    int i_beta_offset;

} x264_slice_header_t;

Steven Walters's avatar
Steven Walters committed
435
436
typedef struct x264_lookahead_t
{
437
    volatile uint8_t              b_exit_thread;
Steven Walters's avatar
Steven Walters committed
438
439
    uint8_t                       b_thread_active;
    uint8_t                       b_analyse_keyframe;
Fiona Glaser's avatar
Fiona Glaser committed
440
    int                           i_last_keyframe;
Steven Walters's avatar
Steven Walters committed
441
442
    int                           i_slicetype_length;
    x264_frame_t                  *last_nonb;
443
444
445
446
    x264_pthread_t                thread_handle;
    x264_sync_frame_list_t        ifbuf;
    x264_sync_frame_list_t        next;
    x264_sync_frame_list_t        ofbuf;
Steven Walters's avatar
Steven Walters committed
447
448
} x264_lookahead_t;

Laurent Aimar's avatar
Laurent Aimar committed
449
450
typedef struct x264_ratecontrol_t   x264_ratecontrol_t;

451
452
453
454
455
456
457
458
459
/* Five small lookup tables of four byte-sized entries each. x264_t points at
 * one (const) instance through mb.left_index_table.
 * NOTE(review): presumably index tables for left-neighbour data - confirm
 * against the code that fills and reads them. */
typedef struct x264_left_table_t
{
    uint8_t intra[4];
    uint8_t nnz[4];
    uint8_t nnz_chroma[4];
    uint8_t mv[4];
    uint8_t ref[4];
} x264_left_table_t;

460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
/* Current frame stats: bit counts, per-category macroblock counters and
 * quality metrics. */
typedef struct
{
    /* MV bits (MV+Ref+Block Type) */
    int i_mv_bits;
    /* Texture bits (DCT coefs) */
    int i_tex_bits;
    /* Miscellaneous bits.
     * NOTE(review): presumably everything not counted as MV or texture bits - confirm. */
    int i_misc_bits;
    /* MB type counts */
    int i_mb_count[19];
    int i_mb_count_i;
    int i_mb_count_p;
    int i_mb_count_skip;
    int i_mb_count_8x8dct[2];
    int i_mb_count_ref[2][X264_REF_MAX*2];
    int i_mb_partition[17];
    int i_mb_cbp[6];
    int i_mb_pred_mode[4][13];
    int i_mb_field[3];
    /* Adaptive direct mv pred */
    int i_direct_score[2];
    /* Metrics */
    int64_t i_ssd[3];
    double f_ssim;
    int i_ssim_cnt;
} x264_frame_stat_t;

Laurent Aimar's avatar
Laurent Aimar committed
488
489
490
491
492
struct x264_t
{
    /* encoder parameters */
    x264_param_t    param;

Steven Walters's avatar
Steven Walters committed
493
    x264_t          *thread[X264_THREAD_MAX+1];
Fiona Glaser's avatar
Fiona Glaser committed
494
    x264_t          *lookahead_thread[X264_LOOKAHEAD_THREAD_MAX];
Loren Merritt's avatar
Loren Merritt committed
495
496
    int             b_thread_active;
    int             i_thread_phase; /* which thread to use for the next frame */
497
    int             i_thread_idx;   /* which thread this is */
498
499
    int             i_threadslice_start; /* first row in this thread slice */
    int             i_threadslice_end; /* row after the end of this thread slice */
500
    int             i_threadslice_pass; /* which pass of encoding we are on */
501
    x264_threadpool_t *threadpool;
Fiona Glaser's avatar
Fiona Glaser committed
502
    x264_threadpool_t *lookaheadpool;
503
504
    x264_pthread_mutex_t mutex;
    x264_pthread_cond_t cv;
Loren Merritt's avatar
Loren Merritt committed
505

Laurent Aimar's avatar
Laurent Aimar committed
506
507
508
509
    /* bitstream output */
    struct
    {
        int         i_nal;
Fiona Glaser's avatar
Fiona Glaser committed
510
511
        int         i_nals_allocated;
        x264_nal_t  *nal;
Laurent Aimar's avatar
Laurent Aimar committed
512
513
514
515
516
        int         i_bitstream;    /* size of p_bitstream */
        uint8_t     *p_bitstream;   /* will hold data for all nal */
        bs_t        bs;
    } out;

517
518
519
    uint8_t *nal_buffer;
    int      nal_buffer_size;

520
521
522
    x264_t          *reconfig_h;
    int             reconfig;

Loren Merritt's avatar
Loren Merritt committed
523
524
    /**** thread synchronization starts here ****/

Laurent Aimar's avatar
Laurent Aimar committed
525
526
    /* frame number/poc */
    int             i_frame;
527
    int             i_frame_num;
Laurent Aimar's avatar
Laurent Aimar committed
528

529
530
531
532
    int             i_thread_frames; /* Number of different frames being encoded by threads;
                                      * 1 when sliced-threads is on. */
    int             i_nal_type;
    int             i_nal_ref_idc;
Loren Merritt's avatar
Loren Merritt committed
533

534
    int64_t         i_disp_fields;  /* Number of displayed fields (both coded and implied via pic_struct) */
535
    int             i_disp_fields_last_frame;
536
537
538
    int64_t         i_prev_duration; /* Duration of previous frame */
    int64_t         i_coded_fields; /* Number of coded fields (both coded and implied via pic_struct) */
    int64_t         i_cpb_delay;    /* Equal to number of fields preceding this field
539
                                     * since last buffering_period SEI */
540
541
    int64_t         i_coded_fields_lookahead; /* Use separate counters for lookahead */
    int64_t         i_cpb_delay_lookahead;
542

543
    int64_t         i_cpb_delay_pir_offset;
Kieran Kunhya's avatar
Kieran Kunhya committed
544
    int64_t         i_cpb_delay_pir_offset_next;
Kieran Kunhya's avatar
Kieran Kunhya committed
545

546
    int             b_queued_intra_refresh;
547
    int64_t         i_last_idr_pts;
548

Laurent Aimar's avatar
Laurent Aimar committed
549
550
    int             i_idr_pic_id;

Loren Merritt's avatar
Loren Merritt committed
551
552
    /* quantization matrix for decoding, [cqm][qp%6][coef] */
    int             (*dequant4_mf[4])[16];   /* [4][6][16] */
Fiona Glaser's avatar
Fiona Glaser committed
553
    int             (*dequant8_mf[4])[64];   /* [4][6][64] */
Loren Merritt's avatar
Loren Merritt committed
554
    /* quantization matrix for trellis, [cqm][qp][coef] */
555
556
    int             (*unquant4_mf[4])[16];   /* [4][QP_MAX_SPEC+1][16] */
    int             (*unquant8_mf[4])[64];   /* [4][QP_MAX_SPEC+1][64] */
Loren Merritt's avatar
Loren Merritt committed
557
    /* quantization matrix for deadzone */
558
559
560
561
562
563
    udctcoef        (*quant4_mf[4])[16];     /* [4][QP_MAX_SPEC+1][16] */
    udctcoef        (*quant8_mf[4])[64];     /* [4][QP_MAX_SPEC+1][64] */
    udctcoef        (*quant4_bias[4])[16];   /* [4][QP_MAX_SPEC+1][16] */
    udctcoef        (*quant8_bias[4])[64];   /* [4][QP_MAX_SPEC+1][64] */
    udctcoef        (*quant4_bias0[4])[16];  /* [4][QP_MAX_SPEC+1][16] */
    udctcoef        (*quant8_bias0[4])[64];  /* [4][QP_MAX_SPEC+1][64] */
Fiona Glaser's avatar
Fiona Glaser committed
564
    udctcoef        (*nr_offset_emergency)[4][64];
Loren Merritt's avatar
Loren Merritt committed
565

Fiona Glaser's avatar
Fiona Glaser committed
566
567
568
    /* mv/ref cost arrays. */
    uint16_t *cost_mv[QP_MAX+1];
    uint16_t *cost_mv_fpel[QP_MAX+1][4];
569

570
571
    const uint8_t   *chroma_qp_table; /* includes both the nonlinear luma->chroma mapping and chroma_qp_offset */

Laurent Aimar's avatar
Laurent Aimar committed
572
573
574
    /* Slice header */
    x264_slice_header_t sh;

575
576
577
578
    /* SPS / PPS */
    x264_sps_t      sps[1];
    x264_pps_t      pps[1];

Fiona Glaser's avatar
Fiona Glaser committed
579
580
581
582
    /* Slice header backup, for SEI_DEC_REF_PIC_MARKING */
    int b_sh_backup;
    x264_slice_header_t sh_backup;

Laurent Aimar's avatar
Laurent Aimar committed
583
584
585
586
587
    /* cabac context */
    x264_cabac_t    cabac;

    struct
    {
588
        /* Frames to be encoded (whose types have been decided) */
Steven Walters's avatar
Steven Walters committed
589
590
591
        x264_frame_t **current;
        /* Unused frames: 0 = fenc, 1 = fdec */
        x264_frame_t **unused[2];
Laurent Aimar's avatar
Laurent Aimar committed
592

Dylan Yudaken's avatar
Dylan Yudaken committed
593
594
595
        /* Unused blank frames (for duplicates) */
        x264_frame_t **blank_unused;

596
        /* frames used for reference + sentinels */
597
        x264_frame_t *reference[X264_REF_MAX+2];
Laurent Aimar's avatar
Laurent Aimar committed
598

Lamont Alston's avatar
Lamont Alston committed
599
600
601
602
603
        int i_last_keyframe;       /* Frame number of the last keyframe */
        int i_last_idr;            /* Frame number of the last IDR (not RP)*/
        int i_poc_last_open_gop;   /* Poc of the I frame of the last open-gop. The value
                                    * is only assigned during the period between that
                                    * I frame and the next P or I frame, else -1 */
604
605

        int i_input;    /* Number of input frames already accepted */
606
607
608
609

        int i_max_dpb;  /* Number of frames allocated in the decoded picture buffer */
        int i_max_ref0;
        int i_max_ref1;
610
        int i_delay;    /* Number of frames buffered for B reordering */
611
612
        int     i_bframe_delay;
        int64_t i_bframe_delay_time;
613
        int64_t i_first_pts;
Yusuke Nakamura's avatar
Yusuke Nakamura committed
614
        int64_t i_prev_reordered_pts[2];
615
616
        int64_t i_largest_pts;
        int64_t i_second_largest_pts;
617
        int b_have_lowres;  /* Whether 1/2 resolution luma planes are being used */
Loren Merritt's avatar
Loren Merritt committed
618
        int b_have_sub8x8_esa;
Laurent Aimar's avatar
Laurent Aimar committed
619
620
621
622
623
624
625
626
627
    } frames;

    /* current frame being encoded */
    x264_frame_t    *fenc;

    /* frame being reconstructed */
    x264_frame_t    *fdec;

    /* references lists */
628
629
    int             i_ref[2];
    x264_frame_t    *fref[2][X264_REF_MAX+3];
630
    x264_frame_t    *fref_nearest[2];
631
    int             b_ref_reorder[2];
Laurent Aimar's avatar
Laurent Aimar committed
632

633
634
    /* hrd */
    int initial_cpb_removal_delay;
Kieran Kunhya's avatar
Kieran Kunhya committed
635
    int initial_cpb_removal_delay_offset;
636
    int64_t i_reordered_pts_delay;
Laurent Aimar's avatar
Laurent Aimar committed
637
638
639
640

    /* Current MB DCT coeffs */
    struct
    {
641
        ALIGNED_N( dctcoef luma16x16_dc[3][16] );
Henrik Gramner's avatar
Henrik Gramner committed
642
        ALIGNED_16( dctcoef chroma_dc[2][8] );
643
        // FIXME share memory?
644
645
        ALIGNED_N( dctcoef luma8x8[12][64] );
        ALIGNED_N( dctcoef luma4x4[16*3][16] );
Laurent Aimar's avatar
Laurent Aimar committed
646
647
648
649
650
    } dct;

    /* MB table and cache for current frame/mb */
    struct
    {
651
652
        int     i_mb_width;
        int     i_mb_height;
653
654
        int     i_mb_count;                 /* number of mbs in a frame */

Henrik Gramner's avatar
Henrik Gramner committed
655
656
657
658
        /* Chroma subsampling */
        int     chroma_h_shift;
        int     chroma_v_shift;

Laurent Aimar's avatar
Laurent Aimar committed
659
660
        /* Strides */
        int     i_mb_stride;
661
662
        int     i_b8_stride;
        int     i_b4_stride;
Simon Horlick's avatar
Simon Horlick committed
663
664
        int     left_b8[2];
        int     left_b4[2];
Laurent Aimar's avatar
Laurent Aimar committed
665
666
667
668
669

        /* Current index */
        int     i_mb_x;
        int     i_mb_y;
        int     i_mb_xy;
670
671
        int     i_b8_xy;
        int     i_b4_xy;
Loren Merritt's avatar
Loren Merritt committed
672

673
        /* Search parameters */
Loren Merritt's avatar
Loren Merritt committed
674
        int     i_me_method;
675
        int     i_subpel_refine;
Loren Merritt's avatar
Loren Merritt committed
676
        int     b_chroma_me;
Loren Merritt's avatar
Loren Merritt committed
677
        int     b_trellis;
678
        int     b_noise_reduction;
679
        int     b_dct_decimate;
680
681
        int     i_psy_rd; /* Psy RD strength--fixed point value*/
        int     i_psy_trellis; /* Psy trellis strength--fixed point value*/
682

683
        int     b_interlaced;
684
        int     b_adaptive_mbaff; /* MBAFF+subme 0 requires non-adaptive MBAFF i.e. all field mbs */
685

686
        /* Allowed qpel MV range to stay within the picture + emulated edge pixels */
687
688
        int     mv_min[2];
        int     mv_max[2];
Simon Horlick's avatar
Simon Horlick committed
689
690
        int     mv_miny_row[3]; /* 0 == top progressive, 1 == bot progressive, 2 == interlaced */
        int     mv_maxy_row[3];
691
692
693
694
        /* Subpel MV range for motion search.
         * same mv_min/max but includes levels' i_mv_range. */
        int     mv_min_spel[2];
        int     mv_max_spel[2];
Simon Horlick's avatar
Simon Horlick committed
695
696
        int     mv_miny_spel_row[3];
        int     mv_maxy_spel_row[3];
697
        /* Fullpel MV range for motion search */
698
        ALIGNED_8( int16_t mv_limit_fpel[2][2] ); /* min_x, min_y, max_x, max_y */
Simon Horlick's avatar
Simon Horlick committed
699
700
        int     mv_miny_fpel_row[3];
        int     mv_maxy_fpel_row[3];
701

Loren Merritt's avatar
Loren Merritt committed
702
        /* neighboring MBs */
Laurent Aimar's avatar
Laurent Aimar committed
703
        unsigned int i_neighbour;
704
705
        unsigned int i_neighbour8[4];       /* neighbours of each 8x8 or 4x4 block that are available */
        unsigned int i_neighbour4[16];      /* at the time the block is coded */
706
        unsigned int i_neighbour_intra;     /* for constrained intra pred */
707
        unsigned int i_neighbour_frame;     /* ignoring slice boundaries */
Loren Merritt's avatar
Loren Merritt committed
708
        int     i_mb_type_top;
709
        int     i_mb_type_left[2];
Loren Merritt's avatar
Loren Merritt committed
710
711
        int     i_mb_type_topleft;
        int     i_mb_type_topright;
712
        int     i_mb_prev_xy;
713
        int     i_mb_left_xy[2];
714
        int     i_mb_top_xy;
715
716
        int     i_mb_topleft_xy;
        int     i_mb_topright_xy;
Simon Horlick's avatar
Simon Horlick committed
717
718
719
        int     i_mb_top_y;
        int     i_mb_topleft_y;
        int     i_mb_topright_y;
Fiona Glaser's avatar
Fiona Glaser committed
720
        const x264_left_table_t *left_index_table;
721
        int     i_mb_top_mbpair_xy;
Simon Horlick's avatar
Simon Horlick committed
722
        int     topleft_partition;
723
        int     b_allow_skip;
724
        int     field_decoding_flag;
Laurent Aimar's avatar
Laurent Aimar committed
725

Loren Merritt's avatar
Loren Merritt committed
726
        /**** thread synchronization ends here ****/
Loren Merritt's avatar
Loren Merritt committed
727
        /* subsequent variables are either thread-local or constant,
Loren Merritt's avatar
Loren Merritt committed
728
729
         * and won't be copied from one thread to another */

Laurent Aimar's avatar
Laurent Aimar committed
730
        /* mb table */
Henrik Gramner's avatar
Henrik Gramner committed
731
        uint8_t *base;                      /* base pointer for all malloced data in this mb */
Laurent Aimar's avatar
Laurent Aimar committed
732
        int8_t  *type;                      /* mb type */
733
        uint8_t *partition;                 /* mb partition */
Laurent Aimar's avatar
Laurent Aimar committed
734
735
        int8_t  *qp;                        /* mb qp */
        int16_t *cbp;                       /* mb cbp: 0x0?: luma, 0x?0: chroma, 0x100: luma dc, 0x0200 and 0x0400: chroma dc  (all set for PCM)*/
736
737
        int8_t  (*intra4x4_pred_mode)[8];   /* intra4x4 pred mode. for non I4x4 set to I_PRED_4x4_DC(2) */
                                            /* actually has only 7 entries; set to 8 for write-combining optimizations */
Fiona Glaser's avatar
Fiona Glaser committed
738
        uint8_t (*non_zero_count)[16*3];    /* nzc. for I_PCM set to 16 */
Laurent Aimar's avatar
Laurent Aimar committed
739
740
        int8_t  *chroma_pred_mode;          /* chroma_pred_mode. cabac only. for non intra I_PRED_CHROMA_DC(0) */
        int16_t (*mv[2])[2];                /* mb mv. set to 0 for intra mb */
Henrik Gramner's avatar
Henrik Gramner committed
741
        uint8_t (*mvd[2])[8][2];            /* absolute value of mb mv difference with predict, clipped to [0,33]. set to 0 if intra. cabac only */
742
        int8_t   *ref[2];                   /* mb ref. set to -1 if non used (intra or Lx only) */
743
        int16_t (*mvr[2][X264_REF_MAX*2])[2];/* 16x16 mv for each possible ref */
744
        int8_t  *skipbp;                    /* block pattern for SKIP or DIRECT (sub)mbs. B-frames + cabac only */
745
        int8_t  *mb_transform_size;         /* transform_size_8x8_flag of each mb */
746
747
        uint16_t *slice_table;              /* sh->first_mb of the slice that the indexed mb is part of
                                             * NOTE: this will fail on resolutions above 2^16 MBs... */
748
        uint8_t *field;
749

Dylan Yudaken's avatar
Dylan Yudaken committed
750
         /* buffer for weighted versions of the reference frames */
751
        pixel *p_weight_buf[X264_REF_MAX];
Dylan Yudaken's avatar
Dylan Yudaken committed
752

Laurent Aimar's avatar
Laurent Aimar committed
753
754
755
        /* current value */
        int     i_type;
        int     i_partition;
756
        ALIGNED_4( uint8_t i_sub_partition[4] );
757
        int     b_transform_8x8;
Laurent Aimar's avatar
Laurent Aimar committed
758
759
760
761
762
763
764

        int     i_cbp_luma;
        int     i_cbp_chroma;

        int     i_intra16x16_pred_mode;
        int     i_chroma_pred_mode;

765
766
767
768
769
        /* skip flags for i4x4 and i8x8
         * 0 = encode as normal.
         * 1 (non-RD only) = the DCT is still in h->dct, restore fdec and skip reconstruction.
         * 2 (RD only) = the DCT has since been overwritten by RD; restore that too. */
        int i_skip_intra;
Fiona Glaser's avatar
Fiona Glaser committed
770
771
        /* skip flag for motion compensation */
        /* if we've already done MC, we don't need to do it again */
772
        int b_skip_mc;
Fiona Glaser's avatar
Fiona Glaser committed
773
774
        /* set to true if we are re-encoding a macroblock. */
        int b_reencode_mb;
Fiona Glaser's avatar
Fiona Glaser committed
775
        int ip_offset; /* Used by PIR to offset the quantizer of intra-refresh blocks. */
Fiona Glaser's avatar
Fiona Glaser committed
776
        int b_deblock_rdo;
777
        int b_overflow; /* If CAVLC had a level code overflow during bitstream writing. */
778

Laurent Aimar's avatar
Laurent Aimar committed
779
780
        /* Working buffers and plane pointers for the macroblock being coded:
         * the source (fenc) and reconstruction (fdec) blocks, backups used to
         * skip intra re-encoding, psy caches, and reference frame pointers. */
        struct
        {
781
782
783
            /* space for p_fenc and p_fdec; the buffer sizes below are
             * multiples of FENC_STRIDE / FDEC_STRIDE */
#define FENC_STRIDE 16
#define FDEC_STRIDE 32
Fiona Glaser's avatar
Fiona Glaser committed
784
            ALIGNED_16( pixel fenc_buf[48*FENC_STRIDE] );
785
            ALIGNED_N( pixel fdec_buf[52*FDEC_STRIDE] );
786

Loren Merritt's avatar
Loren Merritt committed
787
            /* i4x4 and i8x8 backup data, for skipping the encode stage when possible */
788
789
            ALIGNED_16( pixel i4x4_fdec_buf[16*16] );
            ALIGNED_16( pixel i8x8_fdec_buf[16*16] );
790
791
            ALIGNED_16( dctcoef i8x8_dct_buf[3][64] );
            ALIGNED_16( dctcoef i4x4_dct_buf[15][16] );
792
793
794
795
            uint32_t i4x4_nnz_buf[4];
            uint32_t i8x8_nnz_buf[4];
            int i4x4_cbp;
            int i8x8_cbp;
796

797
            /* Psy trellis DCT data */
798
799
            ALIGNED_16( dctcoef fenc_dct8[4][64] );
            ALIGNED_16( dctcoef fenc_dct4[16][16] );
800

801
            /* Psy RD SATD/SA8D scores cache */
Henrik Gramner's avatar
Henrik Gramner committed
802
803
            ALIGNED_N( uint64_t fenc_hadamard_cache[9] );
            ALIGNED_N( uint32_t fenc_satd_cache[32] );
804

Laurent Aimar's avatar
Laurent Aimar committed
805
            /* pointers to the mb of the frame to be compressed */
806
            pixel *p_fenc[3]; /* y,u,v */
807
            /* pointers to the actual source frame, not a block copy */
Fiona Glaser's avatar
Fiona Glaser committed
808
            pixel *p_fenc_plane[3];
Laurent Aimar's avatar
Laurent Aimar committed
809

Loren Merritt's avatar
Loren Merritt committed
810
            /* pointers to the mb of the frame to be reconstructed */
811
            pixel *p_fdec[3];
Laurent Aimar's avatar
Laurent Aimar committed
812
813

            /* pointers to the mb in the reference frames */
            /* NOTE(review): i_fref[2] looks like the number of references per list -- confirm */
814
            int i_fref[2];
Fiona Glaser's avatar
Fiona Glaser committed
815
816
            /* [12]: yN, yH, yV, yHV, (NV12 ? uv : I444 ? (uN, uH, uV, uHV, vN, ...)) */
            pixel *p_fref[2][X264_REF_MAX*2][12];
817
818
            pixel *p_fref_w[X264_REF_MAX*2];  /* weighted fullpel luma */
            uint16_t *p_integral[2][X264_REF_MAX];
Laurent Aimar's avatar
Laurent Aimar committed
819

820
            /* fref stride (NOTE(review): three entries, presumably one per plane -- confirm) */
Laurent Aimar's avatar
Laurent Aimar committed
821
822
823
824
825
826
            int     i_stride[3];
        } pic;

        /* cache: per-macroblock copies of prediction modes, non-zero counts,
         * reference indices and motion vectors, plus values derived from the
         * neighbouring macroblocks.
         * NOTE(review): the X264_SCAN8_* sized arrays are presumably indexed
         * through the scan8 layout -- confirm against its definition. */
        struct
        {
827
            /* real intra4x4_pred_mode if I_4X4 or I_8X8, I_PRED_4x4_DC if mb available, -1 if not */
Fiona Glaser's avatar
Fiona Glaser committed
828
            ALIGNED_8( int8_t intra4x4_pred_mode[X264_SCAN8_LUMA_SIZE] );
Laurent Aimar's avatar
Laurent Aimar committed
829

Loren Merritt's avatar
Loren Merritt committed
830
            /* non-zero coefficient count if available, else 0x80 */
Henrik Gramner's avatar
Henrik Gramner committed
831
            ALIGNED_16( uint8_t non_zero_count[X264_SCAN8_SIZE] );
Laurent Aimar's avatar
Laurent Aimar committed
832

Loren Merritt's avatar
Loren Merritt committed
833
            /* reference index: -1 if unused, -2 if unavailable */
Fiona Glaser's avatar
Fiona Glaser committed
834
            ALIGNED_4( int8_t ref[2][X264_SCAN8_LUMA_SIZE] );
Laurent Aimar's avatar
Laurent Aimar committed
835

Loren Merritt's avatar
Loren Merritt committed
836
            /* motion vectors (mv) and mv differences (mvd): 0 if not available */
Fiona Glaser's avatar
Fiona Glaser committed
837
838
            ALIGNED_16( int16_t mv[2][X264_SCAN8_LUMA_SIZE][2] );
            ALIGNED_8( uint8_t mvd[2][X264_SCAN8_LUMA_SIZE][2] );
839
840

            /* 1 if SKIP or DIRECT. set only for B-frames + CABAC */
Fiona Glaser's avatar
Fiona Glaser committed
841
            ALIGNED_4( int8_t skip[X264_SCAN8_LUMA_SIZE] );
842

843
844
            /* NOTE(review): presumably the mvs/refs/partition derived for direct
             * prediction and the mv used for P-skip -- confirm against users */
            ALIGNED_4( int16_t direct_mv[2][4][2] );
            ALIGNED_4( int8_t  direct_ref[2][4] );
845
            int     direct_partition;
846
            ALIGNED_4( int16_t pskip_mv[2] );
847

848
849
            /* number of neighbors (top and left) that used 8x8 dct */
            int     i_neighbour_transform_size;
Simon Horlick's avatar
Simon Horlick committed
850
            /* NOTE(review): presumably skip information of the neighbors -- confirm */
            int     i_neighbour_skip;
851
852
853
854

            /* neighbor CBPs */
            int     i_cbp_top;
            int     i_cbp_left;
Simon Horlick's avatar
Simon Horlick committed
855
856
857
858

            /* extra data required for mbaff in mv prediction */
            int16_t topright_mv[2][3][2];
            int8_t  topright_ref[2][3];
859
860
861

            /* current mb deblock strength */
            uint8_t (*deblock_strength)[8][4];
Laurent Aimar's avatar
Laurent Aimar committed
862
863
864
        } cache;

        /* */
865
        int     i_qp;       /* current qp */
866
        int     i_chroma_qp;
Laurent Aimar's avatar
Laurent Aimar committed
867
868
        int     i_last_qp;  /* last qp */
        int     i_last_dqp; /* last delta qp */
869
        int     b_variable_qp; /* whether qp is allowed to vary per macroblock */
Loren Merritt's avatar
Loren Merritt committed
870
        int     b_lossless;
Loren Merritt's avatar
Loren Merritt committed
871
872
        int     b_direct_auto_read; /* take stats for --direct auto from the 2pass log */
        int     b_direct_auto_write; /* analyse direct modes, to use and/or save */
Laurent Aimar's avatar
Laurent Aimar committed
873

Fiona Glaser's avatar
Fiona Glaser committed
874
875
876
877
878
        /* lambda values */
        int     i_trellis_lambda2[2][2]; /* [luma,chroma][inter,intra] */
        int     i_psy_rd_lambda;
        int     i_chroma_lambda2_offset;

879
        /* B_direct and weighted prediction */
Simon Horlick's avatar
Simon Horlick committed
880
        int16_t dist_scale_factor_buf[2][2][X264_REF_MAX*2][4];
881
        int16_t (*dist_scale_factor)[4];
Simon Horlick's avatar
Simon Horlick committed
882
        int8_t bipred_weight_buf[2][2][X264_REF_MAX*2][4];
883
        int8_t (*bipred_weight)[4];
884
        /* maps fref1[0]'s ref indices into the current list0 */
885
#define map_col_to_list0(col) h->mb.map_col_to_list0[(col)+2]
886
        int8_t  map_col_to_list0[X264_REF_MAX+2];
Fiona Glaser's avatar
Fiona Glaser committed
887
        int ref_blind_dupe; /* The index of the blind reference frame duplicate. */
888
        int8_t deblock_ref_table[X264_REF_MAX*2+2];
Fiona Glaser's avatar
Fiona Glaser committed
889
#define deblock_ref_table(x) h->mb.deblock_ref_table[(x)+2]
Laurent Aimar's avatar
Laurent Aimar committed
890
891
892
893
894
895
896
897
    } mb;

    /* rate control encoding only */
    x264_ratecontrol_t *rc;

    /* stats: statistics for the current frame plus totals kept across frames */
    struct
    {
898
        /* Current frame stats */
899
        x264_frame_stat_t frame;
900

Loren Merritt's avatar
Loren Merritt committed
901
        /* Cumulative stats */
902

Laurent Aimar's avatar
Laurent Aimar committed
903
        /* per slice info
         * NOTE(review): the [3] arrays are presumably indexed by slice type -- confirm */
Fiona Glaser's avatar
Fiona Glaser committed
904
905
906
        int     i_frame_count[3];
        int64_t i_frame_size[3];
        double  f_frame_qp[3];
907
        int     i_consecutive_bframes[X264_BFRAME_MAX+1];
908
        /* SSD, PSNR, SSIM and frame duration statistics */
Fiona Glaser's avatar
Fiona Glaser committed
909
910
911
912
913
914
915
        double  f_ssd_global[3];
        double  f_psnr_average[3];
        double  f_psnr_mean_y[3];
        double  f_psnr_mean_u[3];
        double  f_psnr_mean_v[3];
        double  f_ssim_mean_y[3];
        double  f_frame_duration[3];
916
        /* macroblock statistics */
Fiona Glaser's avatar
Fiona Glaser committed
917
        int64_t i_mb_count[3][19];
918
        int64_t i_mb_partition[2][17];
919
        int64_t i_mb_count_8x8dct[2];
920
        int64_t i_mb_count_ref[2][2][X264_REF_MAX*2];
921
        int64_t i_mb_cbp[6];
922
        int64_t i_mb_pred_mode[4][13];
Fiona Glaser's avatar
Fiona Glaser committed
923
        int64_t i_mb_field[3];
Loren Merritt's avatar
Loren Merritt committed
924
925
926
        /* direct prediction statistics */
        int     i_direct_score[2];
        int     i_direct_frames[2];
Dylan Yudaken's avatar
Dylan Yudaken committed
927
        /* num p-frames weighted */
Fiona Glaser's avatar
Fiona Glaser committed
928
        int     i_wpred[2];
929

Laurent Aimar's avatar
Laurent Aimar committed
930
931
    } stat;

Fiona Glaser's avatar
Fiona Glaser committed
932
    /* 0 = luma 4x4, 1 = luma 8x8, 2 = chroma 4x4, 3 = chroma 8x8 */
Fiona Glaser's avatar
Fiona Glaser committed
933
934
935
936
    udctcoef (*nr_offset)[64];
    uint32_t (*nr_residual_sum)[64];
    uint32_t *nr_count;

937
938
    ALIGNED_N( udctcoef nr_offset_denoise[4][64] );
    ALIGNED_N( uint32_t nr_residual_sum_buf[2][4][64] );
Fiona Glaser's avatar
Fiona Glaser committed
939
    uint32_t nr_count_buf[2][4];
Anton Mitrofanov's avatar
Anton Mitrofanov committed
940

Henrik Gramner's avatar
Henrik Gramner committed
941
942
    uint8_t luma2chroma_pixel[7]; /* Subsampled pixel size */

943
    /* Buffers that are allocated per-thread even in sliced threads. */
944
    void *scratch_buffer; /* for any temporary storage that doesn't want repeated malloc */
Fiona Glaser's avatar
Fiona Glaser committed
945
    void *scratch_buffer2; /* if the first one's already in use */
Fiona Glaser's avatar
Fiona Glaser committed
946
    pixel *intra_border_backup[5][3]; /* bottom pixels of the previous mb row, used for intra prediction after the framebuffer has been deblocked */
947
948
949
    /* Deblock strength values are stored for each 4x4 partition. In MBAFF
     * there are four extra values that need to be stored, located in [4][i]. */
    uint8_t (*deblock_strength[2])[2][8][4];
950

Loren Merritt's avatar
Loren Merritt committed
951
    /* CPU-dependent functions */
Laurent Aimar's avatar
Laurent Aimar committed
952
    x264_predict_t      predict_16x16[4+3];
953
    x264_predict8x8_t   predict_8x8[9+3];
Laurent Aimar's avatar
Laurent Aimar committed
954
    x264_predict_t      predict_4x4[9+3];
Henrik Gramner's avatar
Henrik Gramner committed
955
956
957
    x264_predict_t      predict_chroma[4+3];
    x264_predict_t      predict_8x8c[4+3];
    x264_predict_t      predict_8x16c[4+3];
958
    x264_predict_8x8_filter_t predict_8x8_filter;
Laurent Aimar's avatar
Laurent Aimar committed
959
960

    x264_pixel_function_t pixf;
961
    x264_mc_functions_t   mc;
Laurent Aimar's avatar
Laurent Aimar committed
962
    x264_dct_function_t   dctf;
963
    x264_zigzag_function_t zigzagf;
964
965
    x264_zigzag_function_t zigzagf_interlaced;
    x264_zigzag_function_t zigzagf_progressive;
966
    x264_quant_function_t quantf;
Loren Merritt's avatar
Loren Merritt committed
967
    x264_deblock_function_t loopf;