CoCalc -- swscale

05. Matplotlib / ffmpeg-3.0 / libswscale / swscale_internal.h
⁵²⁸⁶⁸ views
1
/*
2
 * Copyright (C) 2001-2011 Michael Niedermayer <[email protected]>
3
 *
4
 * This file is part of FFmpeg.
5
 *
6
 * FFmpeg is free software; you can redistribute it and/or
7
 * modify it under the terms of the GNU Lesser General Public
8
 * License as published by the Free Software Foundation; either
9
 * version 2.1 of the License, or (at your option) any later version.
10
 *
11
 * FFmpeg is distributed in the hope that it will be useful,
12
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
13
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14
 * Lesser General Public License for more details.
15
 *
16
 * You should have received a copy of the GNU Lesser General Public
17
 * License along with FFmpeg; if not, write to the Free Software
18
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19
 */
20

21
#ifndef SWSCALE_SWSCALE_INTERNAL_H
22
#define SWSCALE_SWSCALE_INTERNAL_H
23

24
#include "config.h"
25

26
#if HAVE_ALTIVEC_H
27
#include <altivec.h>
28
#endif
29

30
#include "version.h"
31

32
#include "libavutil/avassert.h"
33
#include "libavutil/avutil.h"
34
#include "libavutil/common.h"
35
#include "libavutil/intreadwrite.h"
36
#include "libavutil/log.h"
37
#include "libavutil/pixfmt.h"
38
#include "libavutil/pixdesc.h"
39

40
#define STR(s) AV_TOSTRING(s) // AV_STRINGIFY is too long
41

42
#define YUVRGB_TABLE_HEADROOM 512
43
#define YUVRGB_TABLE_LUMA_HEADROOM 512
44

45
#define MAX_FILTER_SIZE SWS_MAX_FILTER_SIZE
46

47
#define DITHER1XBPP
48

49
#if HAVE_BIGENDIAN
50
#define ALT32_CORR (-1)
51
#else
52
#define ALT32_CORR   1
53
#endif
54

55
#if ARCH_X86_64
56
#   define APCK_PTR2  8
57
#   define APCK_COEF 16
58
#   define APCK_SIZE 24
59
#else
60
#   define APCK_PTR2  4
61
#   define APCK_COEF  8
62
#   define APCK_SIZE 16
63
#endif
64

65
#define RETCODE_USE_CASCADE -12345
66

67
struct SwsContext;
68

69
typedef enum SwsDither {
70
    SWS_DITHER_NONE = 0,
71
    SWS_DITHER_AUTO,
72
    SWS_DITHER_BAYER,
73
    SWS_DITHER_ED,
74
    SWS_DITHER_A_DITHER,
75
    SWS_DITHER_X_DITHER,
76
    NB_SWS_DITHER,
77
} SwsDither;
78

79
typedef enum SwsAlphaBlend {
80
    SWS_ALPHA_BLEND_NONE  = 0,
81
    SWS_ALPHA_BLEND_UNIFORM,
82
    SWS_ALPHA_BLEND_CHECKERBOARD,
83
    SWS_ALPHA_BLEND_NB,
84
} SwsAlphaBlend;
85

86
typedef int (*SwsFunc)(struct SwsContext *context, const uint8_t *src[],
87
                       int srcStride[], int srcSliceY, int srcSliceH,
88
                       uint8_t *dst[], int dstStride[]);
89

90
/**
91
 * Write one line of horizontally scaled data to planar output
92
 * without any additional vertical scaling (or point-scaling).
93
 *
94
 * @param src     scaled source data, 15bit for 8-10bit output,
95
 *                19-bit for 16bit output (in int32_t)
96
 * @param dest    pointer to the output plane. For >8bit
97
 *                output, this is in uint16_t
98
 * @param dstW    width of destination in pixels
99
 * @param dither  ordered dither array of type int16_t and size 8
100
 * @param offset  Dither offset
101
 */
102
typedef void (*yuv2planar1_fn)(const int16_t *src, uint8_t *dest, int dstW,
103
                               const uint8_t *dither, int offset);
104

105
/**
106
 * Write one line of horizontally scaled data to planar output
107
 * with multi-point vertical scaling between input pixels.
108
 *
109
 * @param filter        vertical luma/alpha scaling coefficients, 12bit [0,4096]
110
 * @param src           scaled luma (Y) or alpha (A) source data, 15bit for 8-10bit output,
111
 *                      19-bit for 16bit output (in int32_t)
112
 * @param filterSize    number of vertical input lines to scale
113
 * @param dest          pointer to output plane. For >8bit
114
 *                      output, this is in uint16_t
115
 * @param dstW          width of destination pixels
116
 * @param offset        Dither offset
117
 */
118
typedef void (*yuv2planarX_fn)(const int16_t *filter, int filterSize,
119
                               const int16_t **src, uint8_t *dest, int dstW,
120
                               const uint8_t *dither, int offset);
121

122
/**
123
 * Write one line of horizontally scaled chroma to interleaved output
124
 * with multi-point vertical scaling between input pixels.
125
 *
126
 * @param c             SWS scaling context
127
 * @param chrFilter     vertical chroma scaling coefficients, 12bit [0,4096]
128
 * @param chrUSrc       scaled chroma (U) source data, 15bit for 8-10bit output,
129
 *                      19-bit for 16bit output (in int32_t)
130
 * @param chrVSrc       scaled chroma (V) source data, 15bit for 8-10bit output,
131
 *                      19-bit for 16bit output (in int32_t)
132
 * @param chrFilterSize number of vertical chroma input lines to scale
133
 * @param dest          pointer to the output plane. For >8bit
134
 *                      output, this is in uint16_t
135
 * @param dstW          width of chroma planes
136
 */
137
typedef void (*yuv2interleavedX_fn)(struct SwsContext *c,
138
                                    const int16_t *chrFilter,
139
                                    int chrFilterSize,
140
                                    const int16_t **chrUSrc,
141
                                    const int16_t **chrVSrc,
142
                                    uint8_t *dest, int dstW);
143

144
/**
145
 * Write one line of horizontally scaled Y/U/V/A to packed-pixel YUV/RGB
146
 * output without any additional vertical scaling (or point-scaling). Note
147
 * that this function may do chroma scaling, see the "uvalpha" argument.
148
 *
149
 * @param c       SWS scaling context
150
 * @param lumSrc  scaled luma (Y) source data, 15bit for 8-10bit output,
151
 *                19-bit for 16bit output (in int32_t)
152
 * @param chrUSrc scaled chroma (U) source data, 15bit for 8-10bit output,
153
 *                19-bit for 16bit output (in int32_t)
154
 * @param chrVSrc scaled chroma (V) source data, 15bit for 8-10bit output,
155
 *                19-bit for 16bit output (in int32_t)
156
 * @param alpSrc  scaled alpha (A) source data, 15bit for 8-10bit output,
157
 *                19-bit for 16bit output (in int32_t)
158
 * @param dest    pointer to the output plane. For 16bit output, this is
159
 *                uint16_t
160
 * @param dstW    width of lumSrc and alpSrc in pixels, number of pixels
161
 *                to write into dest[]
162
 * @param uvalpha chroma scaling coefficient for the second line of chroma
163
 *                pixels, either 2048 or 0. If 0, one chroma input is used
164
 *                for 2 output pixels (or if the SWS_FLAG_FULL_CHR_INT flag
165
 *                is set, it generates 1 output pixel). If 2048, two chroma
166
 *                input pixels should be averaged for 2 output pixels (this
167
 *                only happens if SWS_FLAG_FULL_CHR_INT is not set)
168
 * @param y       vertical line number for this output. This does not need
169
 *                to be used to calculate the offset in the destination,
170
 *                but can be used to generate comfort noise using dithering
171
 *                for some output formats.
172
 */
173
typedef void (*yuv2packed1_fn)(struct SwsContext *c, const int16_t *lumSrc,
174
                               const int16_t *chrUSrc[2],
175
                               const int16_t *chrVSrc[2],
176
                               const int16_t *alpSrc, uint8_t *dest,
177
                               int dstW, int uvalpha, int y);
178
/**
179
 * Write one line of horizontally scaled Y/U/V/A to packed-pixel YUV/RGB
180
 * output by doing bilinear scaling between two input lines.
181
 *
182
 * @param c       SWS scaling context
183
 * @param lumSrc  scaled luma (Y) source data, 15bit for 8-10bit output,
184
 *                19-bit for 16bit output (in int32_t)
185
 * @param chrUSrc scaled chroma (U) source data, 15bit for 8-10bit output,
186
 *                19-bit for 16bit output (in int32_t)
187
 * @param chrVSrc scaled chroma (V) source data, 15bit for 8-10bit output,
188
 *                19-bit for 16bit output (in int32_t)
189
 * @param alpSrc  scaled alpha (A) source data, 15bit for 8-10bit output,
190
 *                19-bit for 16bit output (in int32_t)
191
 * @param dest    pointer to the output plane. For 16bit output, this is
192
 *                uint16_t
193
 * @param dstW    width of lumSrc and alpSrc in pixels, number of pixels
194
 *                to write into dest[]
195
 * @param yalpha  luma/alpha scaling coefficients for the second input line.
196
 *                The first line's coefficients can be calculated by using
197
 *                4096 - yalpha
198
 * @param uvalpha chroma scaling coefficient for the second input line. The
199
 *                first line's coefficients can be calculated by using
200
 *                4096 - uvalpha
201
 * @param y       vertical line number for this output. This does not need
202
 *                to be used to calculate the offset in the destination,
203
 *                but can be used to generate comfort noise using dithering
204
 *                for some output formats.
205
 */
206
typedef void (*yuv2packed2_fn)(struct SwsContext *c, const int16_t *lumSrc[2],
207
                               const int16_t *chrUSrc[2],
208
                               const int16_t *chrVSrc[2],
209
                               const int16_t *alpSrc[2],
210
                               uint8_t *dest,
211
                               int dstW, int yalpha, int uvalpha, int y);
212
/**
213
 * Write one line of horizontally scaled Y/U/V/A to packed-pixel YUV/RGB
214
 * output by doing multi-point vertical scaling between input pixels.
215
 *
216
 * @param c             SWS scaling context
217
 * @param lumFilter     vertical luma/alpha scaling coefficients, 12bit [0,4096]
218
 * @param lumSrc        scaled luma (Y) source data, 15bit for 8-10bit output,
219
 *                      19-bit for 16bit output (in int32_t)
220
 * @param lumFilterSize number of vertical luma/alpha input lines to scale
221
 * @param chrFilter     vertical chroma scaling coefficients, 12bit [0,4096]
222
 * @param chrUSrc       scaled chroma (U) source data, 15bit for 8-10bit output,
223
 *                      19-bit for 16bit output (in int32_t)
224
 * @param chrVSrc       scaled chroma (V) source data, 15bit for 8-10bit output,
225
 *                      19-bit for 16bit output (in int32_t)
226
 * @param chrFilterSize number of vertical chroma input lines to scale
227
 * @param alpSrc        scaled alpha (A) source data, 15bit for 8-10bit output,
228
 *                      19-bit for 16bit output (in int32_t)
229
 * @param dest          pointer to the output plane. For 16bit output, this is
230
 *                      uint16_t
231
 * @param dstW          width of lumSrc and alpSrc in pixels, number of pixels
232
 *                      to write into dest[]
233
 * @param y             vertical line number for this output. This does not need
234
 *                      to be used to calculate the offset in the destination,
235
 *                      but can be used to generate comfort noise using dithering
236
 *                      or some output formats.
237
 */
238
typedef void (*yuv2packedX_fn)(struct SwsContext *c, const int16_t *lumFilter,
239
                               const int16_t **lumSrc, int lumFilterSize,
240
                               const int16_t *chrFilter,
241
                               const int16_t **chrUSrc,
242
                               const int16_t **chrVSrc, int chrFilterSize,
243
                               const int16_t **alpSrc, uint8_t *dest,
244
                               int dstW, int y);
245

246
/**
247
 * Write one line of horizontally scaled Y/U/V/A to YUV/RGB
248
 * output by doing multi-point vertical scaling between input pixels.
249
 *
250
 * @param c             SWS scaling context
251
 * @param lumFilter     vertical luma/alpha scaling coefficients, 12bit [0,4096]
252
 * @param lumSrc        scaled luma (Y) source data, 15bit for 8-10bit output,
253
 *                      19-bit for 16bit output (in int32_t)
254
 * @param lumFilterSize number of vertical luma/alpha input lines to scale
255
 * @param chrFilter     vertical chroma scaling coefficients, 12bit [0,4096]
256
 * @param chrUSrc       scaled chroma (U) source data, 15bit for 8-10bit output,
257
 *                      19-bit for 16bit output (in int32_t)
258
 * @param chrVSrc       scaled chroma (V) source data, 15bit for 8-10bit output,
259
 *                      19-bit for 16bit output (in int32_t)
260
 * @param chrFilterSize number of vertical chroma input lines to scale
261
 * @param alpSrc        scaled alpha (A) source data, 15bit for 8-10bit output,
262
 *                      19-bit for 16bit output (in int32_t)
263
 * @param dest          pointer to the output planes. For 16bit output, this is
264
 *                      uint16_t
265
 * @param dstW          width of lumSrc and alpSrc in pixels, number of pixels
266
 *                      to write into dest[]
267
 * @param y             vertical line number for this output. This does not need
268
 *                      to be used to calculate the offset in the destination,
269
 *                      but can be used to generate comfort noise using dithering
270
 *                      or some output formats.
271
 */
272
typedef void (*yuv2anyX_fn)(struct SwsContext *c, const int16_t *lumFilter,
273
                            const int16_t **lumSrc, int lumFilterSize,
274
                            const int16_t *chrFilter,
275
                            const int16_t **chrUSrc,
276
                            const int16_t **chrVSrc, int chrFilterSize,
277
                            const int16_t **alpSrc, uint8_t **dest,
278
                            int dstW, int y);
279

280
struct SwsSlice;
281
struct SwsFilterDescriptor;
282

283
/* This struct should be aligned on at least a 32-byte boundary. */
284
typedef struct SwsContext {
285
    /**
286
     * info on struct for av_log
287
     */
288
    const AVClass *av_class;
289

290
    /**
291
     * Note that src, dst, srcStride, dstStride will be copied in the
292
     * sws_scale() wrapper so they can be freely modified here.
293
     */
294
    SwsFunc swscale;
295
    int srcW;                     ///< Width  of source      luma/alpha planes.
296
    int srcH;                     ///< Height of source      luma/alpha planes.
297
    int dstH;                     ///< Height of destination luma/alpha planes.
298
    int chrSrcW;                  ///< Width  of source      chroma     planes.
299
    int chrSrcH;                  ///< Height of source      chroma     planes.
300
    int chrDstW;                  ///< Width  of destination chroma     planes.
301
    int chrDstH;                  ///< Height of destination chroma     planes.
302
    int lumXInc, chrXInc;
303
    int lumYInc, chrYInc;
304
    enum AVPixelFormat dstFormat; ///< Destination pixel format.
305
    enum AVPixelFormat srcFormat; ///< Source      pixel format.
306
    int dstFormatBpp;             ///< Number of bits per pixel of the destination pixel format.
307
    int srcFormatBpp;             ///< Number of bits per pixel of the source      pixel format.
308
    int dstBpc, srcBpc;
309
    int chrSrcHSubSample;         ///< Binary logarithm of horizontal subsampling factor between luma/alpha and chroma planes in source      image.
310
    int chrSrcVSubSample;         ///< Binary logarithm of vertical   subsampling factor between luma/alpha and chroma planes in source      image.
311
    int chrDstHSubSample;         ///< Binary logarithm of horizontal subsampling factor between luma/alpha and chroma planes in destination image.
312
    int chrDstVSubSample;         ///< Binary logarithm of vertical   subsampling factor between luma/alpha and chroma planes in destination image.
313
    int vChrDrop;                 ///< Binary logarithm of extra vertical subsampling factor in source image chroma planes specified by user.
314
    int sliceDir;                 ///< Direction that slices are fed to the scaler (1 = top-to-bottom, -1 = bottom-to-top).
315
    double param[2];              ///< Input parameters for scaling algorithms that need them.
316

317
    /* The cascaded_* fields allow spliting a scaler task into multiple
318
     * sequential steps, this is for example used to limit the maximum
319
     * downscaling factor that needs to be supported in one scaler.
320
     */
321
    struct SwsContext *cascaded_context[3];
322
    int cascaded_tmpStride[4];
323
    uint8_t *cascaded_tmp[4];
324
    int cascaded1_tmpStride[4];
325
    uint8_t *cascaded1_tmp[4];
326
    int cascaded_mainindex;
327

328
    double gamma_value;
329
    int gamma_flag;
330
    int is_internal_gamma;
331
    uint16_t *gamma;
332
    uint16_t *inv_gamma;
333

334
    int numDesc;
335
    int descIndex[2];
336
    int numSlice;
337
    struct SwsSlice *slice;
338
    struct SwsFilterDescriptor *desc;
339

340
    uint32_t pal_yuv[256];
341
    uint32_t pal_rgb[256];
342

343
    /**
344
     * @name Scaled horizontal lines ring buffer.
345
     * The horizontal scaler keeps just enough scaled lines in a ring buffer
346
     * so they may be passed to the vertical scaler. The pointers to the
347
     * allocated buffers for each line are duplicated in sequence in the ring
348
     * buffer to simplify indexing and avoid wrapping around between lines
349
     * inside the vertical scaler code. The wrapping is done before the
350
     * vertical scaler is called.
351
     */
352
    //@{
353
    int16_t **lumPixBuf;          ///< Ring buffer for scaled horizontal luma   plane lines to be fed to the vertical scaler.
354
    int16_t **chrUPixBuf;         ///< Ring buffer for scaled horizontal chroma plane lines to be fed to the vertical scaler.
355
    int16_t **chrVPixBuf;         ///< Ring buffer for scaled horizontal chroma plane lines to be fed to the vertical scaler.
356
    int16_t **alpPixBuf;          ///< Ring buffer for scaled horizontal alpha  plane lines to be fed to the vertical scaler.
357
    int vLumBufSize;              ///< Number of vertical luma/alpha lines allocated in the ring buffer.
358
    int vChrBufSize;              ///< Number of vertical chroma     lines allocated in the ring buffer.
359
    int lastInLumBuf;             ///< Last scaled horizontal luma/alpha line from source in the ring buffer.
360
    int lastInChrBuf;             ///< Last scaled horizontal chroma     line from source in the ring buffer.
361
    int lumBufIndex;              ///< Index in ring buffer of the last scaled horizontal luma/alpha line from source.
362
    int chrBufIndex;              ///< Index in ring buffer of the last scaled horizontal chroma     line from source.
363
    //@}
364

365
    uint8_t *formatConvBuffer;
366

367
    /**
368
     * @name Horizontal and vertical filters.
369
     * To better understand the following fields, here is a pseudo-code of
370
     * their usage in filtering a horizontal line:
371
     * @code
372
     * for (i = 0; i < width; i++) {
373
     *     dst[i] = 0;
374
     *     for (j = 0; j < filterSize; j++)
375
     *         dst[i] += src[ filterPos[i] + j ] * filter[ filterSize * i + j ];
376
     *     dst[i] >>= FRAC_BITS; // The actual implementation is fixed-point.
377
     * }
378
     * @endcode
379
     */
380
    //@{
381
    int16_t *hLumFilter;          ///< Array of horizontal filter coefficients for luma/alpha planes.
382
    int16_t *hChrFilter;          ///< Array of horizontal filter coefficients for chroma     planes.
383
    int16_t *vLumFilter;          ///< Array of vertical   filter coefficients for luma/alpha planes.
384
    int16_t *vChrFilter;          ///< Array of vertical   filter coefficients for chroma     planes.
385
    int32_t *hLumFilterPos;       ///< Array of horizontal filter starting positions for each dst[i] for luma/alpha planes.
386
    int32_t *hChrFilterPos;       ///< Array of horizontal filter starting positions for each dst[i] for chroma     planes.
387
    int32_t *vLumFilterPos;       ///< Array of vertical   filter starting positions for each dst[i] for luma/alpha planes.
388
    int32_t *vChrFilterPos;       ///< Array of vertical   filter starting positions for each dst[i] for chroma     planes.
389
    int hLumFilterSize;           ///< Horizontal filter size for luma/alpha pixels.
390
    int hChrFilterSize;           ///< Horizontal filter size for chroma     pixels.
391
    int vLumFilterSize;           ///< Vertical   filter size for luma/alpha pixels.
392
    int vChrFilterSize;           ///< Vertical   filter size for chroma     pixels.
393
    //@}
394

395
    int lumMmxextFilterCodeSize;  ///< Runtime-generated MMXEXT horizontal fast bilinear scaler code size for luma/alpha planes.
396
    int chrMmxextFilterCodeSize;  ///< Runtime-generated MMXEXT horizontal fast bilinear scaler code size for chroma planes.
397
    uint8_t *lumMmxextFilterCode; ///< Runtime-generated MMXEXT horizontal fast bilinear scaler code for luma/alpha planes.
398
    uint8_t *chrMmxextFilterCode; ///< Runtime-generated MMXEXT horizontal fast bilinear scaler code for chroma planes.
399

400
    int canMMXEXTBeUsed;
401
    int warned_unuseable_bilinear;
402

403
    int dstY;                     ///< Last destination vertical line output from last slice.
404
    int flags;                    ///< Flags passed by the user to select scaler algorithm, optimizations, subsampling, etc...
405
    void *yuvTable;             // pointer to the yuv->rgb table start so it can be freed()
406
    // alignment ensures the offset can be added in a single
407
    // instruction on e.g. ARM
408
    DECLARE_ALIGNED(16, int, table_gV)[256 + 2*YUVRGB_TABLE_HEADROOM];
409
    uint8_t *table_rV[256 + 2*YUVRGB_TABLE_HEADROOM];
410
    uint8_t *table_gU[256 + 2*YUVRGB_TABLE_HEADROOM];
411
    uint8_t *table_bU[256 + 2*YUVRGB_TABLE_HEADROOM];
412
    DECLARE_ALIGNED(16, int32_t, input_rgb2yuv_table)[16+40*4]; // This table can contain both C and SIMD formatted values, the C vales are always at the XY_IDX points
413
#define RY_IDX 0
414
#define GY_IDX 1
415
#define BY_IDX 2
416
#define RU_IDX 3
417
#define GU_IDX 4
418
#define BU_IDX 5
419
#define RV_IDX 6
420
#define GV_IDX 7
421
#define BV_IDX 8
422
#define RGB2YUV_SHIFT 15
423

424
    int *dither_error[4];
425

426
    //Colorspace stuff
427
    int contrast, brightness, saturation;    // for sws_getColorspaceDetails
428
    int srcColorspaceTable[4];
429
    int dstColorspaceTable[4];
430
    int srcRange;                 ///< 0 = MPG YUV range, 1 = JPG YUV range (source      image).
431
    int dstRange;                 ///< 0 = MPG YUV range, 1 = JPG YUV range (destination image).
432
    int src0Alpha;
433
    int dst0Alpha;
434
    int srcXYZ;
435
    int dstXYZ;
436
    int src_h_chr_pos;
437
    int dst_h_chr_pos;
438
    int src_v_chr_pos;
439
    int dst_v_chr_pos;
440
    int yuv2rgb_y_offset;
441
    int yuv2rgb_y_coeff;
442
    int yuv2rgb_v2r_coeff;
443
    int yuv2rgb_v2g_coeff;
444
    int yuv2rgb_u2g_coeff;
445
    int yuv2rgb_u2b_coeff;
446

447
#define RED_DITHER            "0*8"
448
#define GREEN_DITHER          "1*8"
449
#define BLUE_DITHER           "2*8"
450
#define Y_COEFF               "3*8"
451
#define VR_COEFF              "4*8"
452
#define UB_COEFF              "5*8"
453
#define VG_COEFF              "6*8"
454
#define UG_COEFF              "7*8"
455
#define Y_OFFSET              "8*8"
456
#define U_OFFSET              "9*8"
457
#define V_OFFSET              "10*8"
458
#define LUM_MMX_FILTER_OFFSET "11*8"
459
#define CHR_MMX_FILTER_OFFSET "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)
460
#define DSTW_OFFSET           "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*2"
461
#define ESP_OFFSET            "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*2+8"
462
#define VROUNDER_OFFSET       "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*2+16"
463
#define U_TEMP                "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*2+24"
464
#define V_TEMP                "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*2+32"
465
#define Y_TEMP                "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*2+40"
466
#define ALP_MMX_FILTER_OFFSET "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*2+48"
467
#define UV_OFF_PX             "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*3+48"
468
#define UV_OFF_BYTE           "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*3+56"
469
#define DITHER16              "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*3+64"
470
#define DITHER32              "11*8+4*4*"AV_STRINGIFY(MAX_FILTER_SIZE)"*3+80"
471
#define DITHER32_INT          (11*8+4*4*MAX_FILTER_SIZE*3+80) // value equal to above, used for checking that the struct hasn't been changed by mistake
472

473
    DECLARE_ALIGNED(8, uint64_t, redDither);
474
    DECLARE_ALIGNED(8, uint64_t, greenDither);
475
    DECLARE_ALIGNED(8, uint64_t, blueDither);
476

477
    DECLARE_ALIGNED(8, uint64_t, yCoeff);
478
    DECLARE_ALIGNED(8, uint64_t, vrCoeff);
479
    DECLARE_ALIGNED(8, uint64_t, ubCoeff);
480
    DECLARE_ALIGNED(8, uint64_t, vgCoeff);
481
    DECLARE_ALIGNED(8, uint64_t, ugCoeff);
482
    DECLARE_ALIGNED(8, uint64_t, yOffset);
483
    DECLARE_ALIGNED(8, uint64_t, uOffset);
484
    DECLARE_ALIGNED(8, uint64_t, vOffset);
485
    int32_t lumMmxFilter[4 * MAX_FILTER_SIZE];
486
    int32_t chrMmxFilter[4 * MAX_FILTER_SIZE];
487
    int dstW;                     ///< Width  of destination luma/alpha planes.
488
    DECLARE_ALIGNED(8, uint64_t, esp);
489
    DECLARE_ALIGNED(8, uint64_t, vRounder);
490
    DECLARE_ALIGNED(8, uint64_t, u_temp);
491
    DECLARE_ALIGNED(8, uint64_t, v_temp);
492
    DECLARE_ALIGNED(8, uint64_t, y_temp);
493
    int32_t alpMmxFilter[4 * MAX_FILTER_SIZE];
494
    // alignment of these values is not necessary, but merely here
495
    // to maintain the same offset across x8632 and x86-64. Once we
496
    // use proper offset macros in the asm, they can be removed.
497
    DECLARE_ALIGNED(8, ptrdiff_t, uv_off); ///< offset (in pixels) between u and v planes
498
    DECLARE_ALIGNED(8, ptrdiff_t, uv_offx2); ///< offset (in bytes) between u and v planes
499
    DECLARE_ALIGNED(8, uint16_t, dither16)[8];
500
    DECLARE_ALIGNED(8, uint32_t, dither32)[8];
501

502
    const uint8_t *chrDither8, *lumDither8;
503

504
#if HAVE_ALTIVEC
505
    vector signed short   CY;
506
    vector signed short   CRV;
507
    vector signed short   CBU;
508
    vector signed short   CGU;
509
    vector signed short   CGV;
510
    vector signed short   OY;
511
    vector unsigned short CSHIFT;
512
    vector signed short  *vYCoeffsBank, *vCCoeffsBank;
513
#endif
514

515
    int use_mmx_vfilter;
516

517
/* pre defined color-spaces gamma */
518
#define XYZ_GAMMA (2.6f)
519
#define RGB_GAMMA (2.2f)
520
    int16_t *xyzgamma;
521
    int16_t *rgbgamma;
522
    int16_t *xyzgammainv;
523
    int16_t *rgbgammainv;
524
    int16_t xyz2rgb_matrix[3][4];
525
    int16_t rgb2xyz_matrix[3][4];
526

527
    /* function pointers for swscale() */
528
    yuv2planar1_fn yuv2plane1;
529
    yuv2planarX_fn yuv2planeX;
530
    yuv2interleavedX_fn yuv2nv12cX;
531
    yuv2packed1_fn yuv2packed1;
532
    yuv2packed2_fn yuv2packed2;
533
    yuv2packedX_fn yuv2packedX;
534
    yuv2anyX_fn yuv2anyX;
535

536
    /// Unscaled conversion of luma plane to YV12 for horizontal scaler.
537
    void (*lumToYV12)(uint8_t *dst, const uint8_t *src, const uint8_t *src2, const uint8_t *src3,
538
                      int width, uint32_t *pal);
539
    /// Unscaled conversion of alpha plane to YV12 for horizontal scaler.
540
    void (*alpToYV12)(uint8_t *dst, const uint8_t *src, const uint8_t *src2, const uint8_t *src3,
541
                      int width, uint32_t *pal);
542
    /// Unscaled conversion of chroma planes to YV12 for horizontal scaler.
543
    void (*chrToYV12)(uint8_t *dstU, uint8_t *dstV,
544
                      const uint8_t *src1, const uint8_t *src2, const uint8_t *src3,
545
                      int width, uint32_t *pal);
546

547
    /**
548
     * Functions to read planar input, such as planar RGB, and convert
549
     * internally to Y/UV/A.
550
     */
551
    /** @{ */
552
    void (*readLumPlanar)(uint8_t *dst, const uint8_t *src[4], int width, int32_t *rgb2yuv);
553
    void (*readChrPlanar)(uint8_t *dstU, uint8_t *dstV, const uint8_t *src[4],
554
                          int width, int32_t *rgb2yuv);
555
    void (*readAlpPlanar)(uint8_t *dst, const uint8_t *src[4], int width, int32_t *rgb2yuv);
556
    /** @} */
557

558
    /**
559
     * Scale one horizontal line of input data using a bilinear filter
560
     * to produce one line of output data. Compared to SwsContext->hScale(),
561
     * please take note of the following caveats when using these:
562
     * - Scaling is done using only 7bit instead of 14bit coefficients.
563
     * - You can use no more than 5 input pixels to produce 4 output
564
     *   pixels. Therefore, this filter should not be used for downscaling
565
     *   by more than ~20% in width (because that equals more than 5/4th
566
     *   downscaling and thus more than 5 pixels input per 4 pixels output).
567
     * - In general, bilinear filters create artifacts during downscaling
568
     *   (even when <20%), because one output pixel will span more than one
569
     *   input pixel, and thus some pixels will need edges of both neighbor
570
     *   pixels to interpolate the output pixel. Since you can use at most
571
     *   two input pixels per output pixel in bilinear scaling, this is
572
     *   impossible and thus downscaling by any size will create artifacts.
573
     * To enable this type of scaling, set SWS_FLAG_FAST_BILINEAR
574
     * in SwsContext->flags.
575
     */
576
    /** @{ */
577
    void (*hyscale_fast)(struct SwsContext *c,
578
                         int16_t *dst, int dstWidth,
579
                         const uint8_t *src, int srcW, int xInc);
580
    void (*hcscale_fast)(struct SwsContext *c,
581
                         int16_t *dst1, int16_t *dst2, int dstWidth,
582
                         const uint8_t *src1, const uint8_t *src2,
583
                         int srcW, int xInc);
584
    /** @} */
585

586
    /**
587
     * Scale one horizontal line of input data using a filter over the input
588
     * lines, to produce one (differently sized) line of output data.
589
     *
590
     * @param dst        pointer to destination buffer for horizontally scaled
591
     *                   data. If the number of bits per component of one
592
     *                   destination pixel (SwsContext->dstBpc) is <= 10, data
593
     *                   will be 15bpc in 16bits (int16_t) width. Else (i.e.
594
     *                   SwsContext->dstBpc == 16), data will be 19bpc in
595
     *                   32bits (int32_t) width.
596
     * @param dstW       width of destination image
597
     * @param src        pointer to source data to be scaled. If the number of
598
     *                   bits per component of a source pixel (SwsContext->srcBpc)
599
     *                   is 8, this is 8bpc in 8bits (uint8_t) width. Else
600
     *                   (i.e. SwsContext->dstBpc > 8), this is native depth
601
     *                   in 16bits (uint16_t) width. In other words, for 9-bit
602
     *                   YUV input, this is 9bpc, for 10-bit YUV input, this is
603
     *                   10bpc, and for 16-bit RGB or YUV, this is 16bpc.
604
     * @param filter     filter coefficients to be used per output pixel for
605
     *                   scaling. This contains 14bpp filtering coefficients.
606
     *                   Guaranteed to contain dstW * filterSize entries.
607
     * @param filterPos  position of the first input pixel to be used for
608
     *                   each output pixel during scaling. Guaranteed to
609
     *                   contain dstW entries.
610
     * @param filterSize the number of input coefficients to be used (and
611
     *                   thus the number of input pixels to be used) for
612
     *                   creating a single output pixel. Is aligned to 4
613
     *                   (and input coefficients thus padded with zeroes)
614
     *                   to simplify creating SIMD code.
615
     */
616
    /** @{ */
617
    void (*hyScale)(struct SwsContext *c, int16_t *dst, int dstW,
618
                    const uint8_t *src, const int16_t *filter,
619
                    const int32_t *filterPos, int filterSize);
620
    void (*hcScale)(struct SwsContext *c, int16_t *dst, int dstW,
621
                    const uint8_t *src, const int16_t *filter,
622
                    const int32_t *filterPos, int filterSize);
623
    /** @} */
624

625
    /// Color range conversion function for luma plane if needed.
626
    void (*lumConvertRange)(int16_t *dst, int width);
627
    /// Color range conversion function for chroma planes if needed.
628
    void (*chrConvertRange)(int16_t *dst1, int16_t *dst2, int width);
629

630
    int needs_hcscale; ///< Set if there are chroma planes to be converted.
631

632
    SwsDither dither;
633

634
    SwsAlphaBlend alphablend;
635
} SwsContext;
636
//FIXME check init (where 0)
637

638
SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c);
639
int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
640
                             int fullRange, int brightness,
641
                             int contrast, int saturation);
642
void ff_yuv2rgb_init_tables_ppc(SwsContext *c, const int inv_table[4],
643
                                int brightness, int contrast, int saturation);
644

645
void ff_updateMMXDitherTables(SwsContext *c, int dstY, int lumBufIndex, int chrBufIndex,
646
                           int lastInLumBuf, int lastInChrBuf);
647

648
av_cold void ff_sws_init_range_convert(SwsContext *c);
649

650
SwsFunc ff_yuv2rgb_init_x86(SwsContext *c);
651
SwsFunc ff_yuv2rgb_init_ppc(SwsContext *c);
652

653
static av_always_inline int is16BPS(enum AVPixelFormat pix_fmt)
654
{
655
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
656
    av_assert0(desc);
657
    return desc->comp[0].depth == 16;
658
}
659

660
static av_always_inline int is9_OR_10BPS(enum AVPixelFormat pix_fmt)
661
{
662
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
663
    av_assert0(desc);
664
    return desc->comp[0].depth >= 9 && desc->comp[0].depth <= 14;
665
}
666

667
#define isNBPS(x) is9_OR_10BPS(x)
668

669
static av_always_inline int isBE(enum AVPixelFormat pix_fmt)
670
{
671
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
672
    av_assert0(desc);
673
    return desc->flags & AV_PIX_FMT_FLAG_BE;
674
}
675

676
static av_always_inline int isYUV(enum AVPixelFormat pix_fmt)
677
{
678
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
679
    av_assert0(desc);
680
    return !(desc->flags & AV_PIX_FMT_FLAG_RGB) && desc->nb_components >= 2;
681
}
682

683
static av_always_inline int isPlanarYUV(enum AVPixelFormat pix_fmt)
684
{
685
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
686
    av_assert0(desc);
687
    return ((desc->flags & AV_PIX_FMT_FLAG_PLANAR) && isYUV(pix_fmt));
688
}
689

690
static av_always_inline int isRGB(enum AVPixelFormat pix_fmt)
691
{
692
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
693
    av_assert0(desc);
694
    return (desc->flags & AV_PIX_FMT_FLAG_RGB);
695
}
696

697
#if 0 // FIXME
698
#define isGray(x) \
699
    (!(av_pix_fmt_desc_get(x)->flags & AV_PIX_FMT_FLAG_PAL) && \
700
     av_pix_fmt_desc_get(x)->nb_components <= 2)
701
#else
702
#define isGray(x)                      \
703
    ((x) == AV_PIX_FMT_GRAY8       ||  \
704
     (x) == AV_PIX_FMT_YA8         ||  \
705
     (x) == AV_PIX_FMT_GRAY16BE    ||  \
706
     (x) == AV_PIX_FMT_GRAY16LE    ||  \
707
     (x) == AV_PIX_FMT_YA16BE      ||  \
708
     (x) == AV_PIX_FMT_YA16LE)
709
#endif
710

711
#define isRGBinInt(x) \
712
    (           \
713
     (x) == AV_PIX_FMT_RGB48BE     ||  \
714
     (x) == AV_PIX_FMT_RGB48LE     ||  \
715
     (x) == AV_PIX_FMT_RGB32       ||  \
716
     (x) == AV_PIX_FMT_RGB32_1     ||  \
717
     (x) == AV_PIX_FMT_RGB24       ||  \
718
     (x) == AV_PIX_FMT_RGB565BE    ||  \
719
     (x) == AV_PIX_FMT_RGB565LE    ||  \
720
     (x) == AV_PIX_FMT_RGB555BE    ||  \
721
     (x) == AV_PIX_FMT_RGB555LE    ||  \
722
     (x) == AV_PIX_FMT_RGB444BE    ||  \
723
     (x) == AV_PIX_FMT_RGB444LE    ||  \
724
     (x) == AV_PIX_FMT_RGB8        ||  \
725
     (x) == AV_PIX_FMT_RGB4        ||  \
726
     (x) == AV_PIX_FMT_RGB4_BYTE   ||  \
727
     (x) == AV_PIX_FMT_RGBA64BE    ||  \
728
     (x) == AV_PIX_FMT_RGBA64LE    ||  \
729
     (x) == AV_PIX_FMT_MONOBLACK   ||  \
730
     (x) == AV_PIX_FMT_MONOWHITE   \
731
    )
732
#define isBGRinInt(x) \
733
    (           \
734
     (x) == AV_PIX_FMT_BGR48BE     ||  \
735
     (x) == AV_PIX_FMT_BGR48LE     ||  \
736
     (x) == AV_PIX_FMT_BGR32       ||  \
737
     (x) == AV_PIX_FMT_BGR32_1     ||  \
738
     (x) == AV_PIX_FMT_BGR24       ||  \
739
     (x) == AV_PIX_FMT_BGR565BE    ||  \
740
     (x) == AV_PIX_FMT_BGR565LE    ||  \
741
     (x) == AV_PIX_FMT_BGR555BE    ||  \
742
     (x) == AV_PIX_FMT_BGR555LE    ||  \
743
     (x) == AV_PIX_FMT_BGR444BE    ||  \
744
     (x) == AV_PIX_FMT_BGR444LE    ||  \
745
     (x) == AV_PIX_FMT_BGR8        ||  \
746
     (x) == AV_PIX_FMT_BGR4        ||  \
747
     (x) == AV_PIX_FMT_BGR4_BYTE   ||  \
748
     (x) == AV_PIX_FMT_BGRA64BE    ||  \
749
     (x) == AV_PIX_FMT_BGRA64LE    ||  \
750
     (x) == AV_PIX_FMT_MONOBLACK   ||  \
751
     (x) == AV_PIX_FMT_MONOWHITE   \
752
    )
753

754
#define isRGBinBytes(x) (           \
755
           (x) == AV_PIX_FMT_RGB48BE     \
756
        || (x) == AV_PIX_FMT_RGB48LE     \
757
        || (x) == AV_PIX_FMT_RGBA64BE    \
758
        || (x) == AV_PIX_FMT_RGBA64LE    \
759
        || (x) == AV_PIX_FMT_RGBA        \
760
        || (x) == AV_PIX_FMT_ARGB        \
761
        || (x) == AV_PIX_FMT_RGB24       \
762
    )
763
#define isBGRinBytes(x) (           \
764
           (x) == AV_PIX_FMT_BGR48BE     \
765
        || (x) == AV_PIX_FMT_BGR48LE     \
766
        || (x) == AV_PIX_FMT_BGRA64BE    \
767
        || (x) == AV_PIX_FMT_BGRA64LE    \
768
        || (x) == AV_PIX_FMT_BGRA        \
769
        || (x) == AV_PIX_FMT_ABGR        \
770
        || (x) == AV_PIX_FMT_BGR24       \
771
    )
772

773
#define isBayer(x) ( \
774
           (x)==AV_PIX_FMT_BAYER_BGGR8    \
775
        || (x)==AV_PIX_FMT_BAYER_BGGR16LE \
776
        || (x)==AV_PIX_FMT_BAYER_BGGR16BE \
777
        || (x)==AV_PIX_FMT_BAYER_RGGB8    \
778
        || (x)==AV_PIX_FMT_BAYER_RGGB16LE \
779
        || (x)==AV_PIX_FMT_BAYER_RGGB16BE \
780
        || (x)==AV_PIX_FMT_BAYER_GBRG8    \
781
        || (x)==AV_PIX_FMT_BAYER_GBRG16LE \
782
        || (x)==AV_PIX_FMT_BAYER_GBRG16BE \
783
        || (x)==AV_PIX_FMT_BAYER_GRBG8    \
784
        || (x)==AV_PIX_FMT_BAYER_GRBG16LE \
785
        || (x)==AV_PIX_FMT_BAYER_GRBG16BE \
786
    )
787

788
#define isAnyRGB(x) \
789
    (           \
790
          isBayer(x)          ||    \
791
          isRGBinInt(x)       ||    \
792
          isBGRinInt(x)       ||    \
793
          isRGB(x)      \
794
    )
795

796
static av_always_inline int isALPHA(enum AVPixelFormat pix_fmt)
797
{
798
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
799
    av_assert0(desc);
800
    if (pix_fmt == AV_PIX_FMT_PAL8)
801
        return 1;
802
    return desc->flags & AV_PIX_FMT_FLAG_ALPHA;
803
}
804

805
#if 1
806
#define isPacked(x)         (       \
807
           (x)==AV_PIX_FMT_PAL8        \
808
        || (x)==AV_PIX_FMT_YUYV422     \
809
        || (x)==AV_PIX_FMT_YVYU422     \
810
        || (x)==AV_PIX_FMT_UYVY422     \
811
        || (x)==AV_PIX_FMT_YA8       \
812
        || (x)==AV_PIX_FMT_YA16LE      \
813
        || (x)==AV_PIX_FMT_YA16BE      \
814
        || (x)==AV_PIX_FMT_AYUV64LE    \
815
        || (x)==AV_PIX_FMT_AYUV64BE    \
816
        ||  isRGBinInt(x)           \
817
        ||  isBGRinInt(x)           \
818
    )
819
#else
820
static av_always_inline int isPacked(enum AVPixelFormat pix_fmt)
821
{
822
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
823
    av_assert0(desc);
824
    return ((desc->nb_components >= 2 && !(desc->flags & AV_PIX_FMT_FLAG_PLANAR)) ||
825
            pix_fmt == AV_PIX_FMT_PAL8);
826
}
827

828
#endif
829
static av_always_inline int isPlanar(enum AVPixelFormat pix_fmt)
830
{
831
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
832
    av_assert0(desc);
833
    return (desc->nb_components >= 2 && (desc->flags & AV_PIX_FMT_FLAG_PLANAR));
834
}
835

836
static av_always_inline int isPackedRGB(enum AVPixelFormat pix_fmt)
837
{
838
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
839
    av_assert0(desc);
840
    return ((desc->flags & (AV_PIX_FMT_FLAG_PLANAR | AV_PIX_FMT_FLAG_RGB)) == AV_PIX_FMT_FLAG_RGB);
841
}
842

843
static av_always_inline int isPlanarRGB(enum AVPixelFormat pix_fmt)
844
{
845
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
846
    av_assert0(desc);
847
    return ((desc->flags & (AV_PIX_FMT_FLAG_PLANAR | AV_PIX_FMT_FLAG_RGB)) ==
848
            (AV_PIX_FMT_FLAG_PLANAR | AV_PIX_FMT_FLAG_RGB));
849
}
850

851
static av_always_inline int usePal(enum AVPixelFormat pix_fmt)
852
{
853
    const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(pix_fmt);
854
    av_assert0(desc);
855
    return (desc->flags & AV_PIX_FMT_FLAG_PAL) || (desc->flags & AV_PIX_FMT_FLAG_PSEUDOPAL);
856
}
857

858
extern const uint64_t ff_dither4[2];
859
extern const uint64_t ff_dither8[2];
860

861
extern const uint8_t ff_dither_2x2_4[3][8];
862
extern const uint8_t ff_dither_2x2_8[3][8];
863
extern const uint8_t ff_dither_4x4_16[5][8];
864
extern const uint8_t ff_dither_8x8_32[9][8];
865
extern const uint8_t ff_dither_8x8_73[9][8];
866
extern const uint8_t ff_dither_8x8_128[9][8];
867
extern const uint8_t ff_dither_8x8_220[9][8];
868

869
extern const int32_t ff_yuv2rgb_coeffs[8][4];
870

871
extern const AVClass ff_sws_context_class;
872

873
/**
874
 * Set c->swscale to an unscaled converter if one exists for the specific
875
 * source and destination formats, bit depths, flags, etc.
876
 */
877
void ff_get_unscaled_swscale(SwsContext *c);
878
void ff_get_unscaled_swscale_ppc(SwsContext *c);
879
void ff_get_unscaled_swscale_arm(SwsContext *c);
880

881
/**
882
 * Return function pointer to fastest main scaler path function depending
883
 * on architecture and available optimizations.
884
 */
885
SwsFunc ff_getSwsFunc(SwsContext *c);
886

887
void ff_sws_init_input_funcs(SwsContext *c);
888
void ff_sws_init_output_funcs(SwsContext *c,
889
                              yuv2planar1_fn *yuv2plane1,
890
                              yuv2planarX_fn *yuv2planeX,
891
                              yuv2interleavedX_fn *yuv2nv12cX,
892
                              yuv2packed1_fn *yuv2packed1,
893
                              yuv2packed2_fn *yuv2packed2,
894
                              yuv2packedX_fn *yuv2packedX,
895
                              yuv2anyX_fn *yuv2anyX);
896
void ff_sws_init_swscale_ppc(SwsContext *c);
897
void ff_sws_init_swscale_x86(SwsContext *c);
898

899
void ff_hyscale_fast_c(SwsContext *c, int16_t *dst, int dstWidth,
900
                       const uint8_t *src, int srcW, int xInc);
901
void ff_hcscale_fast_c(SwsContext *c, int16_t *dst1, int16_t *dst2,
902
                       int dstWidth, const uint8_t *src1,
903
                       const uint8_t *src2, int srcW, int xInc);
904
int ff_init_hscaler_mmxext(int dstW, int xInc, uint8_t *filterCode,
905
                           int16_t *filter, int32_t *filterPos,
906
                           int numSplits);
907
void ff_hyscale_fast_mmxext(SwsContext *c, int16_t *dst,
908
                            int dstWidth, const uint8_t *src,
909
                            int srcW, int xInc);
910
void ff_hcscale_fast_mmxext(SwsContext *c, int16_t *dst1, int16_t *dst2,
911
                            int dstWidth, const uint8_t *src1,
912
                            const uint8_t *src2, int srcW, int xInc);
913

914
/**
915
 * Allocate and return an SwsContext.
916
 * This is like sws_getContext() but does not perform the init step, allowing
917
 * the user to set additional AVOptions.
918
 *
919
 * @see sws_getContext()
920
 */
921
struct SwsContext *sws_alloc_set_opts(int srcW, int srcH, enum AVPixelFormat srcFormat,
922
                                      int dstW, int dstH, enum AVPixelFormat dstFormat,
923
                                      int flags, const double *param);
924

925
int ff_sws_alphablendaway(SwsContext *c, const uint8_t *src[],
926
                          int srcStride[], int srcSliceY, int srcSliceH,
927
                          uint8_t *dst[], int dstStride[]);
928

929
static inline void fillPlane16(uint8_t *plane, int stride, int width, int height, int y,
930
                               int alpha, int bits, const int big_endian)
931
{
932
    int i, j;
933
    uint8_t *ptr = plane + stride * y;
934
    int v = alpha ? 0xFFFF>>(16-bits) : (1<<(bits-1));
935
    for (i = 0; i < height; i++) {
936
#define FILL(wfunc) \
937
        for (j = 0; j < width; j++) {\
938
            wfunc(ptr+2*j, v);\
939
        }
940
        if (big_endian) {
941
            FILL(AV_WB16);
942
        } else {
943
            FILL(AV_WL16);
944
        }
945
        ptr += stride;
946
    }
947
}
948

949
#define MAX_SLICE_PLANES 4
950

951
/// Slice plane
952
typedef struct SwsPlane
953
{
954
    int available_lines;    ///< max number of lines that can be hold by this plane
955
    int sliceY;             ///< index of first line
956
    int sliceH;             ///< number of lines
957
    uint8_t **line;         ///< line buffer
958
    uint8_t **tmp;          ///< Tmp line buffer used by mmx code
959
} SwsPlane;
960

961
/**
962
 * Struct which defines a slice of an image to be scaled or a output for
963
 * a scaled slice.
964
 * A slice can also be used as intermediate ring buffer for scaling steps.
965
 */
966
typedef struct SwsSlice
967
{
968
    int width;              ///< Slice line width
969
    int h_chr_sub_sample;   ///< horizontal chroma subsampling factor
970
    int v_chr_sub_sample;   ///< vertical chroma subsampling factor
971
    int is_ring;            ///< flag to identify if this slice is a ring buffer
972
    int should_free_lines;  ///< flag to identify if there are dynamic allocated lines
973
    enum AVPixelFormat fmt; ///< planes pixel format
974
    SwsPlane plane[MAX_SLICE_PLANES];   ///< color planes
975
} SwsSlice;
976

977
/**
978
 * Struct which holds all necessary data for processing a slice.
979
 * A processing step can be a color conversion or horizontal/vertical scaling.
980
 */
981
typedef struct SwsFilterDescriptor
982
{
983
    SwsSlice *src;  ///< Source slice
984
    SwsSlice *dst;  ///< Output slice
985

986
    int alpha;      ///< Flag for processing alpha channel
987
    void *instance; ///< Filter instance data
988

989
    /// Function for processing input slice sliceH lines starting from line sliceY
990
    int (*process)(SwsContext *c, struct SwsFilterDescriptor *desc, int sliceY, int sliceH);
991
} SwsFilterDescriptor;
992

993
// warp input lines in the form (src + width*i + j) to slice format (line[i][j])
994
// relative=true means first line src[x][0] otherwise first line is src[x][lum/crh Y]
995
int ff_init_slice_from_src(SwsSlice * s, uint8_t *src[4], int stride[4], int srcW, int lumY, int lumH, int chrY, int chrH, int relative);
996

997
// Initialize scaler filter descriptor chain
998
int ff_init_filters(SwsContext *c);
999

1000
// Free all filter data
1001
int ff_free_filters(SwsContext *c);
1002

1003
/*
1004
 function for applying ring buffer logic into slice s
1005
 It checks if the slice can hold more @lum lines, if yes
1006
 do nothing otherwise remove @lum least used lines.
1007
 It applies the same procedure for @chr lines.
1008
*/
1009
int ff_rotate_slice(SwsSlice *s, int lum, int chr);
1010

1011
/// initializes gamma conversion descriptor
1012
int ff_init_gamma_convert(SwsFilterDescriptor *desc, SwsSlice * src, uint16_t *table);
1013

1014
/// initializes lum pixel format conversion descriptor
1015
int ff_init_desc_fmt_convert(SwsFilterDescriptor *desc, SwsSlice * src, SwsSlice *dst, uint32_t *pal);
1016

1017
/// initializes lum horizontal scaling descriptor
1018
int ff_init_desc_hscale(SwsFilterDescriptor *desc, SwsSlice *src, SwsSlice *dst, uint16_t *filter, int * filter_pos, int filter_size, int xInc);
1019

1020
/// initializes chr pixel format conversion descriptor
1021
int ff_init_desc_cfmt_convert(SwsFilterDescriptor *desc, SwsSlice * src, SwsSlice *dst, uint32_t *pal);
1022

1023
/// initializes chr horizontal scaling descriptor
1024
int ff_init_desc_chscale(SwsFilterDescriptor *desc, SwsSlice *src, SwsSlice *dst, uint16_t *filter, int * filter_pos, int filter_size, int xInc);
1025

1026
int ff_init_desc_no_chr(SwsFilterDescriptor *desc, SwsSlice * src, SwsSlice *dst);
1027

1028
/// initializes vertical scaling descriptors
1029
int ff_init_vscale(SwsContext *c, SwsFilterDescriptor *desc, SwsSlice *src, SwsSlice *dst);
1030

1031
/// setup vertical scaler functions
1032
void ff_init_vscale_pfn(SwsContext *c, yuv2planar1_fn yuv2plane1, yuv2planarX_fn yuv2planeX,
1033
    yuv2interleavedX_fn yuv2nv12cX, yuv2packed1_fn yuv2packed1, yuv2packed2_fn yuv2packed2,
1034
    yuv2packedX_fn yuv2packedX, yuv2anyX_fn yuv2anyX, int use_mmx);
1035

1036
//number of extra lines to process
1037
#define MAX_LINES_AHEAD 4
1038

1039
// enable use of refactored scaler code
1040
#define NEW_FILTER
1041

1042
#endif /* SWSCALE_SWSCALE_INTERNAL_H */
1043

1044
Product

Resources

Company