Statistics
| Branch: | Revision:

ffmpeg / libswscale / swscale_internal.h @ a959e247

History | View | Annotate | Download (14.9 KB)

1
/*
2
 * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
3
 *
4
 * This file is part of FFmpeg.
5
 *
6
 * FFmpeg is free software; you can redistribute it and/or
7
 * modify it under the terms of the GNU Lesser General Public
8
 * License as published by the Free Software Foundation; either
9
 * version 2.1 of the License, or (at your option) any later version.
10
 *
11
 * FFmpeg is distributed in the hope that it will be useful,
12
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14
 * Lesser General Public License for more details.
15
 *
16
 * You should have received a copy of the GNU Lesser General Public
17
 * License along with FFmpeg; if not, write to the Free Software
18
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19
 */
20

    
21
#ifndef SWSCALE_SWSCALE_INTERNAL_H
22
#define SWSCALE_SWSCALE_INTERNAL_H
23

    
24
#include "config.h"
25

    
26
#if HAVE_ALTIVEC_H
27
#include <altivec.h>
28
#endif
29

    
30
#include "libavutil/avutil.h"
31

    
32
/* Stringify helper: shorthand for AV_TOSTRING(). */
#define STR(s)         AV_TOSTRING(s) //AV_STRINGIFY is too long

/*
 * Number of entries (per 4-wide group) reserved in the SwsContext
 * lumMmxFilter / chrMmxFilter / alpMmxFilter arrays.
 * NOTE(review): the *_OFFSET string macros inside SwsContext spell this
 * value out literally as "256"; keep the two in sync.
 */
#define MAX_FILTER_SIZE 256

/*
 * VOFW is architecture dependent; VOF (twice VOFW) is the byte size of
 * SwsContext.formatConvBuffer.
 */
#if ARCH_X86
#define VOFW 5120
#else
#define VOFW 2048 // faster on PPC and not tested on others
#endif

#define VOF  (VOFW*2)

/* Correction term whose sign depends on the target endianness. */
#if HAVE_BIGENDIAN
#define ALT32_CORR (-1)
#else
#define ALT32_CORR   1
#endif

/*
 * APCK_* constants; the values differ between x86-64 and everything else.
 * NOTE(review): presumably member offsets / total size of a packed
 * pointer+coefficient record used by assembly code (pointer size 8 vs 4) --
 * confirm against the users of these macros.
 */
#if ARCH_X86_64
#   define APCK_PTR2 8
#   define APCK_COEF 16
#   define APCK_SIZE 24
#else
#   define APCK_PTR2 4
#   define APCK_COEF 8
#   define APCK_SIZE 16
#endif
59

    
60
struct SwsContext;

/**
 * Signature of a slice conversion function, as stored in
 * SwsContext.swScale.
 *
 * @param context   scaler context
 * @param src       array of source plane pointers
 * @param srcStride array of source plane strides
 * @param srcSliceY first row of the source slice
 * @param srcSliceH number of rows in the source slice
 * @param dst       array of destination plane pointers
 * @param dstStride array of destination plane strides
 * @return int; the meaning of the value is defined by the implementations,
 *         which are not visible in this header
 */
typedef int (*SwsFunc)(struct SwsContext *context, const uint8_t* src[],
                       int srcStride[], int srcSliceY, int srcSliceH,
                       uint8_t* dst[], int dstStride[]);
65

    
66
/* This struct should be aligned on at least a 32-byte boundary. */
67
typedef struct SwsContext {
68
    /**
69
     * info on struct for av_log
70
     */
71
    const AVClass *av_class;
72

    
73
    /**
74
     * Note that src, dst, srcStride, dstStride will be copied in the
75
     * sws_scale() wrapper so they can be freely modified here.
76
     */
77
    SwsFunc swScale;
78
    int srcW, srcH, dstH;
79
    int chrSrcW, chrSrcH, chrDstW, chrDstH;
80
    int lumXInc, chrXInc;
81
    int lumYInc, chrYInc;
82
    enum PixelFormat dstFormat, srcFormat;  ///< format 4:2:0 type is always YV12
83
    int chrSrcHSubSample, chrSrcVSubSample;
84
    int chrDstHSubSample, chrDstVSubSample;
85
    int vChrDrop;
86
    int sliceDir;
87
    double param[2];
88

    
89
    uint32_t pal_yuv[256];
90
    uint32_t pal_rgb[256];
91

    
92
    int16_t **lumPixBuf;
93
    int16_t **chrPixBuf;
94
    int16_t **alpPixBuf;
95
    int16_t *hLumFilter;
96
    int16_t *hLumFilterPos;
97
    int16_t *hChrFilter;
98
    int16_t *hChrFilterPos;
99
    int16_t *vLumFilter;
100
    int16_t *vLumFilterPos;
101
    int16_t *vChrFilter;
102
    int16_t *vChrFilterPos;
103

    
104
    uint8_t formatConvBuffer[VOF]; //FIXME dynamic allocation, but we have to change a lot of code for this to be useful
105

    
106
    int hLumFilterSize;
107
    int hChrFilterSize;
108
    int vLumFilterSize;
109
    int vChrFilterSize;
110
    int vLumBufSize;
111
    int vChrBufSize;
112

    
113
    int lumMmx2FilterCodeSize;
114
    int chrMmx2FilterCodeSize;
115
    uint8_t *lumMmx2FilterCode;
116
    uint8_t *chrMmx2FilterCode;
117
    int32_t *lumMmx2FilterPos;
118
    int32_t *chrMmx2FilterPos;
119
    int16_t *lumMmx2Filter;
120
    int16_t *chrMmx2Filter;
121

    
122
    int canMMX2BeUsed;
123

    
124
    int lastInLumBuf;
125
    int lastInChrBuf;
126
    int lumBufIndex;
127
    int chrBufIndex;
128
    int dstY;
129
    int flags;
130
    void * yuvTable;            // pointer to the yuv->rgb table start so it can be freed()
131
    uint8_t * table_rV[256];
132
    uint8_t * table_gU[256];
133
    int    table_gV[256];
134
    uint8_t * table_bU[256];
135

    
136
    //Colorspace stuff
137
    int contrast, brightness, saturation;    // for sws_getColorspaceDetails
138
    int srcColorspaceTable[4];
139
    int dstColorspaceTable[4];
140
    int srcRange, dstRange;
141
    int yuv2rgb_y_offset;
142
    int yuv2rgb_y_coeff;
143
    int yuv2rgb_v2r_coeff;
144
    int yuv2rgb_v2g_coeff;
145
    int yuv2rgb_u2g_coeff;
146
    int yuv2rgb_u2b_coeff;
147

    
148
#define RED_DITHER            "0*8"
149
#define GREEN_DITHER          "1*8"
150
#define BLUE_DITHER           "2*8"
151
#define Y_COEFF               "3*8"
152
#define VR_COEFF              "4*8"
153
#define UB_COEFF              "5*8"
154
#define VG_COEFF              "6*8"
155
#define UG_COEFF              "7*8"
156
#define Y_OFFSET              "8*8"
157
#define U_OFFSET              "9*8"
158
#define V_OFFSET              "10*8"
159
#define LUM_MMX_FILTER_OFFSET "11*8"
160
#define CHR_MMX_FILTER_OFFSET "11*8+4*4*256"
161
#define DSTW_OFFSET           "11*8+4*4*256*2" //do not change, it is hardcoded in the ASM
162
#define ESP_OFFSET            "11*8+4*4*256*2+8"
163
#define VROUNDER_OFFSET       "11*8+4*4*256*2+16"
164
#define U_TEMP                "11*8+4*4*256*2+24"
165
#define V_TEMP                "11*8+4*4*256*2+32"
166
#define Y_TEMP                "11*8+4*4*256*2+40"
167
#define ALP_MMX_FILTER_OFFSET "11*8+4*4*256*2+48"
168

    
169
    DECLARE_ALIGNED(8, uint64_t, redDither);
170
    DECLARE_ALIGNED(8, uint64_t, greenDither);
171
    DECLARE_ALIGNED(8, uint64_t, blueDither);
172

    
173
    DECLARE_ALIGNED(8, uint64_t, yCoeff);
174
    DECLARE_ALIGNED(8, uint64_t, vrCoeff);
175
    DECLARE_ALIGNED(8, uint64_t, ubCoeff);
176
    DECLARE_ALIGNED(8, uint64_t, vgCoeff);
177
    DECLARE_ALIGNED(8, uint64_t, ugCoeff);
178
    DECLARE_ALIGNED(8, uint64_t, yOffset);
179
    DECLARE_ALIGNED(8, uint64_t, uOffset);
180
    DECLARE_ALIGNED(8, uint64_t, vOffset);
181
    int32_t  lumMmxFilter[4*MAX_FILTER_SIZE];
182
    int32_t  chrMmxFilter[4*MAX_FILTER_SIZE];
183
    int dstW;
184
    DECLARE_ALIGNED(8, uint64_t, esp);
185
    DECLARE_ALIGNED(8, uint64_t, vRounder);
186
    DECLARE_ALIGNED(8, uint64_t, u_temp);
187
    DECLARE_ALIGNED(8, uint64_t, v_temp);
188
    DECLARE_ALIGNED(8, uint64_t, y_temp);
189
    int32_t  alpMmxFilter[4*MAX_FILTER_SIZE];
190

    
191
#if HAVE_ALTIVEC
192
    vector signed short   CY;
193
    vector signed short   CRV;
194
    vector signed short   CBU;
195
    vector signed short   CGU;
196
    vector signed short   CGV;
197
    vector signed short   OY;
198
    vector unsigned short CSHIFT;
199
    vector signed short   *vYCoeffsBank, *vCCoeffsBank;
200
#endif
201

    
202
#if ARCH_BFIN
203
    DECLARE_ALIGNED(4, uint32_t, oy);
204
    DECLARE_ALIGNED(4, uint32_t, oc);
205
    DECLARE_ALIGNED(4, uint32_t, zero);
206
    DECLARE_ALIGNED(4, uint32_t, cy);
207
    DECLARE_ALIGNED(4, uint32_t, crv);
208
    DECLARE_ALIGNED(4, uint32_t, rmask);
209
    DECLARE_ALIGNED(4, uint32_t, cbu);
210
    DECLARE_ALIGNED(4, uint32_t, bmask);
211
    DECLARE_ALIGNED(4, uint32_t, cgu);
212
    DECLARE_ALIGNED(4, uint32_t, cgv);
213
    DECLARE_ALIGNED(4, uint32_t, gmask);
214
#endif
215

    
216
#if HAVE_VIS
217
    DECLARE_ALIGNED(8, uint64_t, sparc_coeffs[10]);
218
#endif
219

    
220
    /* function pointers for swScale() */
221
    void (*yuv2nv12X  )(struct SwsContext *c,
222
                        const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
223
                        const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
224
                        uint8_t *dest, uint8_t *uDest,
225
                        int dstW, int chrDstW, int dstFormat);
226
    void (*yuv2yuv1   )(struct SwsContext *c,
227
                        const int16_t *lumSrc, const int16_t *chrSrc, const int16_t *alpSrc,
228
                        uint8_t *dest,
229
                        uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
230
                        long dstW, long chrDstW);
231
    void (*yuv2yuvX   )(struct SwsContext *c,
232
                        const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
233
                        const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
234
                        const int16_t **alpSrc,
235
                        uint8_t *dest,
236
                        uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
237
                        long dstW, long chrDstW);
238
    void (*yuv2packed1)(struct SwsContext *c,
239
                        const uint16_t *buf0,
240
                        const uint16_t *uvbuf0, const uint16_t *uvbuf1,
241
                        const uint16_t *abuf0,
242
                        uint8_t *dest,
243
                        int dstW, int uvalpha, int dstFormat, int flags, int y);
244
    void (*yuv2packed2)(struct SwsContext *c,
245
                        const uint16_t *buf0, const uint16_t *buf1,
246
                        const uint16_t *uvbuf0, const uint16_t *uvbuf1,
247
                        const uint16_t *abuf0, const uint16_t *abuf1,
248
                        uint8_t *dest,
249
                        int dstW, int yalpha, int uvalpha, int y);
250
    void (*yuv2packedX)(struct SwsContext *c,
251
                        const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
252
                        const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
253
                        const int16_t **alpSrc, uint8_t *dest,
254
                        long dstW, long dstY);
255

    
256
    void (*lumToYV12)(uint8_t *dst, const uint8_t *src,
257
                      long width, uint32_t *pal); ///< Unscaled conversion of luma plane to YV12 for horizontal scaler.
258
    void (*alpToYV12)(uint8_t *dst, const uint8_t *src,
259
                      long width, uint32_t *pal); ///< Unscaled conversion of alpha plane to YV12 for horizontal scaler.
260
    void (*chrToYV12)(uint8_t *dstU, uint8_t *dstV,
261
                      const uint8_t *src1, const uint8_t *src2,
262
                      long width, uint32_t *pal); ///< Unscaled conversion of chroma planes to YV12 for horizontal scaler.
263
    void (*hyscale_fast)(struct SwsContext *c,
264
                         int16_t *dst, long dstWidth,
265
                         const uint8_t *src, int srcW, int xInc);
266
    void (*hcscale_fast)(struct SwsContext *c,
267
                         int16_t *dst, long dstWidth,
268
                         const uint8_t *src1, const uint8_t *src2,
269
                         int srcW, int xInc);
270

    
271
    void (*hScale)(int16_t *dst, int dstW, const uint8_t *src, int srcW,
272
                   int xInc, const int16_t *filter, const int16_t *filterPos,
273
                   long filterSize);
274

    
275
    void (*lumConvertRange)(uint16_t *dst, int width); ///< Color range conversion function for luma plane if needed.
276
    void (*chrConvertRange)(uint16_t *dst, int width); ///< Color range conversion function for chroma planes if needed.
277

    
278
    int lumSrcOffset; ///< Offset given to luma src pointers passed to horizontal input functions.
279
    int chrSrcOffset; ///< Offset given to chroma src pointers passed to horizontal input functions.
280
    int alpSrcOffset; ///< Offset given to alpha src pointers passed to horizontal input functions.
281

    
282
    int needs_hcscale; ///< Set if there are chroma planes to be converted.
283

    
284
} SwsContext;
285
//FIXME check init (where 0)
286

    
287
/*
 * YUV -> RGB converter selection and table initialisation.
 * All of these are defined elsewhere in libswscale; only their signatures
 * are visible in this header.
 */
SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c);
int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
                             int fullRange, int brightness,
                             int contrast, int saturation);

/* Architecture-specific counterparts (AltiVec, MMX, VIS, mlib, Blackfin). */
void ff_yuv2rgb_init_tables_altivec(SwsContext *c, const int inv_table[4],
                                    int brightness, int contrast, int saturation);
SwsFunc ff_yuv2rgb_init_mmx(SwsContext *c);
SwsFunc ff_yuv2rgb_init_vis(SwsContext *c);
SwsFunc ff_yuv2rgb_init_mlib(SwsContext *c);
SwsFunc ff_yuv2rgb_init_altivec(SwsContext *c);
SwsFunc ff_yuv2rgb_get_func_ptr_bfin(SwsContext *c);
void ff_bfin_get_unscaled_swscale(SwsContext *c);
/*
 * NOTE(review): this signature differs from the SwsContext.yuv2packedX
 * member (non-const lumSrc/chrSrc, no alpSrc, int instead of long for
 * dstW/dstY), so it cannot be assigned to that pointer without a wrapper
 * or cast -- confirm how callers use it.
 */
void ff_yuv2packedX_altivec(SwsContext *c,
                            const int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize,
                            const int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize,
                            uint8_t *dest, int dstW, int dstY);

/* Returns a name string for the given pixel format. */
const char *sws_format_name(enum PixelFormat format);
306

    
307
/*
 * Pixel-format classification predicates.
 *
 * Each macro expands to a chain of equality tests against PIX_FMT_*
 * constants and yields non-zero when x is one of the listed formats.
 * The argument is evaluated once per comparison, so do not pass an
 * expression with side effects.
 */
//FIXME replace this with something faster
/* Formats listed here: 16-bit gray, RGB48 and the 16-bit planar YUV formats. */
#define is16BPS(x)      (           \
           (x)==PIX_FMT_GRAY16BE    \
        || (x)==PIX_FMT_GRAY16LE    \
        || (x)==PIX_FMT_RGB48BE     \
        || (x)==PIX_FMT_RGB48LE     \
        || (x)==PIX_FMT_YUV420P16LE \
        || (x)==PIX_FMT_YUV422P16LE \
        || (x)==PIX_FMT_YUV444P16LE \
        || (x)==PIX_FMT_YUV420P16BE \
        || (x)==PIX_FMT_YUV422P16BE \
        || (x)==PIX_FMT_YUV444P16BE \
    )
/*
 * Tests the lowest bit of the format value.
 * NOTE(review): presumably relies on big-endian variants having odd enum
 * values in enum PixelFormat -- verify against pixfmt.h before using this
 * on formats other than the 16-bit ones above.
 */
#define isBE(x) ((x)&1)
/* 8-bit planar (and NV12/NV21 semi-planar) YUV formats. */
#define isPlanar8YUV(x) (           \
           (x)==PIX_FMT_YUV410P     \
        || (x)==PIX_FMT_YUV420P     \
        || (x)==PIX_FMT_YUVA420P    \
        || (x)==PIX_FMT_YUV411P     \
        || (x)==PIX_FMT_YUV422P     \
        || (x)==PIX_FMT_YUV444P     \
        || (x)==PIX_FMT_YUV440P     \
        || (x)==PIX_FMT_NV12        \
        || (x)==PIX_FMT_NV21        \
    )
/* Everything in isPlanar8YUV() plus the 16-bit planar YUV formats. */
#define isPlanarYUV(x)  (           \
        isPlanar8YUV(x)             \
        || (x)==PIX_FMT_YUV420P16LE \
        || (x)==PIX_FMT_YUV422P16LE \
        || (x)==PIX_FMT_YUV444P16LE \
        || (x)==PIX_FMT_YUV420P16BE \
        || (x)==PIX_FMT_YUV422P16BE \
        || (x)==PIX_FMT_YUV444P16BE \
    )
/* Packed UYVY422 / YUYV422 or any format accepted by isPlanarYUV(). */
#define isYUV(x)        (           \
           (x)==PIX_FMT_UYVY422     \
        || (x)==PIX_FMT_YUYV422     \
        || isPlanarYUV(x)           \
    )
/* 8-bit or 16-bit gray. */
#define isGray(x)       (           \
           (x)==PIX_FMT_GRAY8       \
        || (x)==PIX_FMT_GRAY16BE    \
        || (x)==PIX_FMT_GRAY16LE    \
    )
/* 16-bit gray only. */
#define isGray16(x)     (           \
           (x)==PIX_FMT_GRAY16BE    \
        || (x)==PIX_FMT_GRAY16LE    \
    )
/* RGB-ordered formats; MONOBLACK/MONOWHITE are listed here and in isBGR(). */
#define isRGB(x)        (           \
           (x)==PIX_FMT_RGB48BE     \
        || (x)==PIX_FMT_RGB48LE     \
        || (x)==PIX_FMT_RGB32       \
        || (x)==PIX_FMT_RGB32_1     \
        || (x)==PIX_FMT_RGB24       \
        || (x)==PIX_FMT_RGB565      \
        || (x)==PIX_FMT_RGB555      \
        || (x)==PIX_FMT_RGB8        \
        || (x)==PIX_FMT_RGB4        \
        || (x)==PIX_FMT_RGB4_BYTE   \
        || (x)==PIX_FMT_MONOBLACK   \
        || (x)==PIX_FMT_MONOWHITE   \
    )
/* BGR-ordered formats; MONOBLACK/MONOWHITE are listed here and in isRGB(). */
#define isBGR(x)        (           \
           (x)==PIX_FMT_BGR32       \
        || (x)==PIX_FMT_BGR32_1     \
        || (x)==PIX_FMT_BGR24       \
        || (x)==PIX_FMT_BGR565      \
        || (x)==PIX_FMT_BGR555      \
        || (x)==PIX_FMT_BGR8        \
        || (x)==PIX_FMT_BGR4        \
        || (x)==PIX_FMT_BGR4_BYTE   \
        || (x)==PIX_FMT_MONOBLACK   \
        || (x)==PIX_FMT_MONOWHITE   \
    )
/* The 32-bit RGB/BGR formats and YUVA420P. */
#define isALPHA(x)      (           \
           (x)==PIX_FMT_BGR32       \
        || (x)==PIX_FMT_BGR32_1     \
        || (x)==PIX_FMT_RGB32       \
        || (x)==PIX_FMT_RGB32_1     \
        || (x)==PIX_FMT_YUVA420P    \
    )
388

    
389
static inline int fmt_depth(int fmt)
390
{
391
    switch(fmt) {
392
    case PIX_FMT_RGB48BE:
393
    case PIX_FMT_RGB48LE:
394
        return 48;
395
    case PIX_FMT_BGRA:
396
    case PIX_FMT_ABGR:
397
    case PIX_FMT_RGBA:
398
    case PIX_FMT_ARGB:
399
        return 32;
400
    case PIX_FMT_BGR24:
401
    case PIX_FMT_RGB24:
402
        return 24;
403
    case PIX_FMT_BGR565:
404
    case PIX_FMT_RGB565:
405
    case PIX_FMT_GRAY16BE:
406
    case PIX_FMT_GRAY16LE:
407
        return 16;
408
    case PIX_FMT_BGR555:
409
    case PIX_FMT_RGB555:
410
        return 15;
411
    case PIX_FMT_BGR8:
412
    case PIX_FMT_RGB8:
413
        return 8;
414
    case PIX_FMT_BGR4:
415
    case PIX_FMT_RGB4:
416
    case PIX_FMT_BGR4_BYTE:
417
    case PIX_FMT_RGB4_BYTE:
418
        return 4;
419
    case PIX_FMT_MONOBLACK:
420
    case PIX_FMT_MONOWHITE:
421
        return 1;
422
    default:
423
        return 0;
424
    }
425
}
426

    
427
extern const uint64_t ff_dither4[2];
428
extern const uint64_t ff_dither8[2];
429

    
430
extern const AVClass sws_context_class;
431

    
432
#endif /* SWSCALE_SWSCALE_INTERNAL_H */