libswscale/swscale_internal.h

   1 /*
   2  * Copyright (C) 2001-2003 Michael Niedermayer <michaelni@gmx.at>
   3  *
   4  * This file is part of FFmpeg.
   5  *
   6  * FFmpeg is free software; you can redistribute it and/or
   7  * modify it under the terms of the GNU Lesser General Public
   8  * License as published by the Free Software Foundation; either
   9  * version 2.1 of the License, or (at your option) any later version.
  10  *
  11  * FFmpeg is distributed in the hope that it will be useful,
  12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
  13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
  14  * Lesser General Public License for more details.
  15  *
  16  * You should have received a copy of the GNU Lesser General Public
  17  * License along with FFmpeg; if not, write to the Free Software
  18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  19  */
  20
  21 #ifndef SWSCALE_SWSCALE_INTERNAL_H
  22 #define SWSCALE_SWSCALE_INTERNAL_H
  23
  24 #include "config.h"
  25
  26 #if HAVE_ALTIVEC_H
  27 #include <altivec.h>
  28 #endif
  29
  30 #include "libavutil/avutil.h"
  31 #include "libavutil/internal.h"
  32
  33 #define STR(s)         AV_TOSTRING(s) //AV_STRINGIFY is too long
  34
  35 #define MAX_FILTER_SIZE 256
  36
  37 #if ARCH_X86
  38 #define VOFW 5120
  39 #else
  40 #define VOFW 2048 // faster on PPC and not tested on others
  41 #endif
  42
  43 #define VOF  (VOFW*2)
  44
  45 #ifdef WORDS_BIGENDIAN
  46 #define ALT32_CORR (-1)
  47 #else
  48 #define ALT32_CORR   1
  49 #endif
  50
  51 #if ARCH_X86_64
  52 #   define APCK_PTR2 8
  53 #   define APCK_COEF 16
  54 #   define APCK_SIZE 24
  55 #else
  56 #   define APCK_PTR2 4
  57 #   define APCK_COEF 8
  58 #   define APCK_SIZE 16
  59 #endif
  60
  61 struct SwsContext;
  62
  63 typedef int (*SwsFunc)(struct SwsContext *context, uint8_t* src[],
  64                        int srcStride[], int srcSliceY, int srcSliceH,
  65                        uint8_t* dst[], int dstStride[]);
  66
  67 /* This struct should be aligned on at least a 32-byte boundary. */
  68 typedef struct SwsContext{
  69     /**
  70      * info on struct for av_log
  71      */
  72     const AVClass *av_class;
  73
  74     /**
  75      * Note that src, dst, srcStride, dstStride will be copied in the
  76      * sws_scale() wrapper so they can be freely modified here.
  77      */
  78     SwsFunc swScale;
  79     int srcW, srcH, dstH;
  80     int chrSrcW, chrSrcH, chrDstW, chrDstH;
  81     int lumXInc, chrXInc;
  82     int lumYInc, chrYInc;
  83     enum PixelFormat dstFormat, srcFormat;  ///< format 4:2:0 type is always YV12
  84     int origDstFormat, origSrcFormat;       ///< format
  85     int chrSrcHSubSample, chrSrcVSubSample;
  86     int chrIntHSubSample, chrIntVSubSample;
  87     int chrDstHSubSample, chrDstVSubSample;
  88     int vChrDrop;
  89     int sliceDir;
  90     double param[2];
  91
  92     uint32_t pal_yuv[256];
  93     uint32_t pal_rgb[256];
  94
  95     int16_t **lumPixBuf;
  96     int16_t **chrPixBuf;
  97     int16_t **alpPixBuf;
  98     int16_t *hLumFilter;
  99     int16_t *hLumFilterPos;
 100     int16_t *hChrFilter;
 101     int16_t *hChrFilterPos;
 102     int16_t *vLumFilter;
 103     int16_t *vLumFilterPos;
 104     int16_t *vChrFilter;
 105     int16_t *vChrFilterPos;
 106
 107     uint8_t formatConvBuffer[VOF]; //FIXME dynamic allocation, but we have to change a lot of code for this to be useful
 108
 109     int hLumFilterSize;
 110     int hChrFilterSize;
 111     int vLumFilterSize;
 112     int vChrFilterSize;
 113     int vLumBufSize;
 114     int vChrBufSize;
 115
 116     uint8_t *funnyYCode;
 117     uint8_t *funnyUVCode;
 118     int32_t *lumMmx2FilterPos;
 119     int32_t *chrMmx2FilterPos;
 120     int16_t *lumMmx2Filter;
 121     int16_t *chrMmx2Filter;
 122
 123     int canMMX2BeUsed;
 124
 125     int lastInLumBuf;
 126     int lastInChrBuf;
 127     int lumBufIndex;
 128     int chrBufIndex;
 129     int dstY;
 130     int flags;
 131     void * yuvTable;            // pointer to the yuv->rgb table start so it can be freed()
 132     uint8_t * table_rV[256];
 133     uint8_t * table_gU[256];
 134     int    table_gV[256];
 135     uint8_t * table_bU[256];
 136
 137     //Colorspace stuff
 138     int contrast, brightness, saturation;    // for sws_getColorspaceDetails
 139     int srcColorspaceTable[4];
 140     int dstColorspaceTable[4];
 141     int srcRange, dstRange;
 142     int yuv2rgb_y_offset;
 143     int yuv2rgb_y_coeff;
 144     int yuv2rgb_v2r_coeff;
 145     int yuv2rgb_v2g_coeff;
 146     int yuv2rgb_u2g_coeff;
 147     int yuv2rgb_u2b_coeff;
 148
 149 #define RED_DITHER            "0*8"
 150 #define GREEN_DITHER          "1*8"
 151 #define BLUE_DITHER           "2*8"
 152 #define Y_COEFF               "3*8"
 153 #define VR_COEFF              "4*8"
 154 #define UB_COEFF              "5*8"
 155 #define VG_COEFF              "6*8"
 156 #define UG_COEFF              "7*8"
 157 #define Y_OFFSET              "8*8"
 158 #define U_OFFSET              "9*8"
 159 #define V_OFFSET              "10*8"
 160 #define LUM_MMX_FILTER_OFFSET "11*8"
 161 #define CHR_MMX_FILTER_OFFSET "11*8+4*4*256"
 162 #define DSTW_OFFSET           "11*8+4*4*256*2" //do not change, it is hardcoded in the ASM
 163 #define ESP_OFFSET            "11*8+4*4*256*2+8"
 164 #define VROUNDER_OFFSET       "11*8+4*4*256*2+16"
 165 #define U_TEMP                "11*8+4*4*256*2+24"
 166 #define V_TEMP                "11*8+4*4*256*2+32"
 167 #define Y_TEMP                "11*8+4*4*256*2+40"
 168 #define ALP_MMX_FILTER_OFFSET "11*8+4*4*256*2+48"
 169
 170     DECLARE_ALIGNED(8, uint64_t, redDither);
 171     DECLARE_ALIGNED(8, uint64_t, greenDither);
 172     DECLARE_ALIGNED(8, uint64_t, blueDither);
 173
 174     DECLARE_ALIGNED(8, uint64_t, yCoeff);
 175     DECLARE_ALIGNED(8, uint64_t, vrCoeff);
 176     DECLARE_ALIGNED(8, uint64_t, ubCoeff);
 177     DECLARE_ALIGNED(8, uint64_t, vgCoeff);
 178     DECLARE_ALIGNED(8, uint64_t, ugCoeff);
 179     DECLARE_ALIGNED(8, uint64_t, yOffset);
 180     DECLARE_ALIGNED(8, uint64_t, uOffset);
 181     DECLARE_ALIGNED(8, uint64_t, vOffset);
 182     int32_t  lumMmxFilter[4*MAX_FILTER_SIZE];
 183     int32_t  chrMmxFilter[4*MAX_FILTER_SIZE];
 184     int dstW;
 185     DECLARE_ALIGNED(8, uint64_t, esp);
 186     DECLARE_ALIGNED(8, uint64_t, vRounder);
 187     DECLARE_ALIGNED(8, uint64_t, u_temp);
 188     DECLARE_ALIGNED(8, uint64_t, v_temp);
 189     DECLARE_ALIGNED(8, uint64_t, y_temp);
 190     int32_t  alpMmxFilter[4*MAX_FILTER_SIZE];
 191
 192 #if HAVE_ALTIVEC
 193   vector signed short   CY;
 194   vector signed short   CRV;
 195   vector signed short   CBU;
 196   vector signed short   CGU;
 197   vector signed short   CGV;
 198   vector signed short   OY;
 199   vector unsigned short CSHIFT;
 200   vector signed short   *vYCoeffsBank, *vCCoeffsBank;
 201 #endif
 202
 203 #if ARCH_BFIN
 204     DECLARE_ALIGNED(4, uint32_t, oy);
 205     DECLARE_ALIGNED(4, uint32_t, oc);
 206     DECLARE_ALIGNED(4, uint32_t, zero);
 207     DECLARE_ALIGNED(4, uint32_t, cy);
 208     DECLARE_ALIGNED(4, uint32_t, crv);
 209     DECLARE_ALIGNED(4, uint32_t, rmask);
 210     DECLARE_ALIGNED(4, uint32_t, cbu);
 211     DECLARE_ALIGNED(4, uint32_t, bmask);
 212     DECLARE_ALIGNED(4, uint32_t, cgu);
 213     DECLARE_ALIGNED(4, uint32_t, cgv);
 214     DECLARE_ALIGNED(4, uint32_t, gmask);
 215 #endif
 216
 217 #if HAVE_VIS
 218     DECLARE_ALIGNED(8, uint64_t, sparc_coeffs[10]);
 219 #endif
 220
 221     /* function pointers for swScale() */
 222     void (*yuv2nv12X  )(struct SwsContext *c,
 223                         const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
 224                         const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
 225                         uint8_t *dest, uint8_t *uDest,
 226                         int dstW, int chrDstW, int dstFormat);
 227     void (*yuv2yuv1   )(struct SwsContext *c,
 228                         const int16_t *lumSrc, const int16_t *chrSrc, const int16_t *alpSrc,
 229                         uint8_t *dest,
 230                         uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
 231                         long dstW, long chrDstW);
 232     void (*yuv2yuvX   )(struct SwsContext *c,
 233                         const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
 234                         const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
 235                         const int16_t **alpSrc,
 236                         uint8_t *dest,
 237                         uint8_t *uDest, uint8_t *vDest, uint8_t *aDest,
 238                         long dstW, long chrDstW);
 239     void (*yuv2packed1)(struct SwsContext *c,
 240                         const uint16_t *buf0,
 241                         const uint16_t *uvbuf0, const uint16_t *uvbuf1,
 242                         const uint16_t *abuf0,
 243                         uint8_t *dest,
 244                         int dstW, int uvalpha, int dstFormat, int flags, int y);
 245     void (*yuv2packed2)(struct SwsContext *c,
 246                         const uint16_t *buf0, const uint16_t *buf1,
 247                         const uint16_t *uvbuf0, const uint16_t *uvbuf1,
 248                         const uint16_t *abuf0, const uint16_t *abuf1,
 249                         uint8_t *dest,
 250                         int dstW, int yalpha, int uvalpha, int y);
 251     void (*yuv2packedX)(struct SwsContext *c,
 252                         const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize,
 253                         const int16_t *chrFilter, const int16_t **chrSrc, int chrFilterSize,
 254                         const int16_t **alpSrc, uint8_t *dest,
 255                         long dstW, long dstY);
 256
 257     void (*hyscale_internal)(uint8_t *dst, const uint8_t *src,
 258                              long width, uint32_t *pal);
 259     void (*hascale_internal)(uint8_t *dst, const uint8_t *src,
 260                              long width, uint32_t *pal);
 261     void (*hcscale_internal)(uint8_t *dstU, uint8_t *dstV,
 262                              const uint8_t *src1, const uint8_t *src2,
 263                              long width, uint32_t *pal);
 264     void (*hyscale_fast)(struct SwsContext *c,
 265                          int16_t *dst, int dstWidth,
 266                          const uint8_t *src, int srcW, int xInc);
 267     void (*hcscale_fast)(struct SwsContext *c,
 268                          int16_t *dst, int dstWidth,
 269                          const uint8_t *src1, const uint8_t *src2,
 270                          int srcW, int xInc);
 271
 272     void (*hScale)(int16_t *dst, int dstW, const uint8_t *src, int srcW,
 273                    int xInc, const int16_t *filter, const int16_t *filterPos,
 274                    long filterSize);
 275
 276 } SwsContext;
 277 //FIXME check init (where 0)
 278
 279 SwsFunc ff_yuv2rgb_get_func_ptr(SwsContext *c);
 280 int ff_yuv2rgb_c_init_tables(SwsContext *c, const int inv_table[4],
 281                              int fullRange, int brightness,
 282                              int contrast, int saturation);
 283
 284 void ff_yuv2rgb_init_tables_altivec(SwsContext *c, const int inv_table[4],
 285                                     int brightness, int contrast, int saturation);
 286 SwsFunc ff_yuv2rgb_init_mmx(SwsContext *c);
 287 SwsFunc ff_yuv2rgb_init_vis(SwsContext *c);
 288 SwsFunc ff_yuv2rgb_init_mlib(SwsContext *c);
 289 SwsFunc ff_yuv2rgb_init_altivec(SwsContext *c);
 290 SwsFunc ff_yuv2rgb_get_func_ptr_bfin(SwsContext *c);
 291 void ff_bfin_get_unscaled_swscale(SwsContext *c);
 292 void ff_yuv2packedX_altivec(SwsContext *c,
 293                             const int16_t *lumFilter, int16_t **lumSrc, int lumFilterSize,
 294                             const int16_t *chrFilter, int16_t **chrSrc, int chrFilterSize,
 295                             uint8_t *dest, int dstW, int dstY);
 296
 297 const char *sws_format_name(int format);
 298
 299 //FIXME replace this with something faster
 300 #define is16BPS(x)      (           \
 301            (x)==PIX_FMT_GRAY16BE    \
 302         || (x)==PIX_FMT_GRAY16LE    \
 303         || (x)==PIX_FMT_RGB48BE     \
 304         || (x)==PIX_FMT_RGB48LE     \
 305         || (x)==PIX_FMT_YUV420PLE   \
 306         || (x)==PIX_FMT_YUV422PLE   \
 307         || (x)==PIX_FMT_YUV444PLE   \
 308         || (x)==PIX_FMT_YUV420PBE   \
 309         || (x)==PIX_FMT_YUV422PBE   \
 310         || (x)==PIX_FMT_YUV444PBE   \
 311     )
 312 #define isBE(x) ((x)&1)
 313 #define isPlanar8YUV(x) (           \
 314            (x)==PIX_FMT_YUV410P     \
 315         || (x)==PIX_FMT_YUV420P     \
 316         || (x)==PIX_FMT_YUVA420P    \
 317         || (x)==PIX_FMT_YUV411P     \
 318         || (x)==PIX_FMT_YUV422P     \
 319         || (x)==PIX_FMT_YUV444P     \
 320         || (x)==PIX_FMT_YUV440P     \
 321         || (x)==PIX_FMT_NV12        \
 322         || (x)==PIX_FMT_NV21        \
 323     )
 324 #define isPlanarYUV(x)  (           \
 325         isPlanar8YUV(x)             \
 326         || (x)==PIX_FMT_YUV420PLE   \
 327         || (x)==PIX_FMT_YUV422PLE   \
 328         || (x)==PIX_FMT_YUV444PLE   \
 329         || (x)==PIX_FMT_YUV420PBE   \
 330         || (x)==PIX_FMT_YUV422PBE   \
 331         || (x)==PIX_FMT_YUV444PBE   \
 332     )
 333 #define isYUV(x)        (           \
 334            (x)==PIX_FMT_UYVY422     \
 335         || (x)==PIX_FMT_YUYV422     \
 336         || isPlanarYUV(x)           \
 337     )
 338 #define isGray(x)       (           \
 339            (x)==PIX_FMT_GRAY8       \
 340         || (x)==PIX_FMT_GRAY16BE    \
 341         || (x)==PIX_FMT_GRAY16LE    \
 342     )
 343 #define isGray16(x)     (           \
 344            (x)==PIX_FMT_GRAY16BE    \
 345         || (x)==PIX_FMT_GRAY16LE    \
 346     )
 347 #define isRGB(x)        (           \
 348            (x)==PIX_FMT_RGB48BE     \
 349         || (x)==PIX_FMT_RGB48LE     \
 350         || (x)==PIX_FMT_RGB32       \
 351         || (x)==PIX_FMT_RGB32_1     \
 352         || (x)==PIX_FMT_RGB24       \
 353         || (x)==PIX_FMT_RGB565      \
 354         || (x)==PIX_FMT_RGB555      \
 355         || (x)==PIX_FMT_RGB8        \
 356         || (x)==PIX_FMT_RGB4        \
 357         || (x)==PIX_FMT_RGB4_BYTE   \
 358         || (x)==PIX_FMT_MONOBLACK   \
 359         || (x)==PIX_FMT_MONOWHITE   \
 360     )
 361 #define isBGR(x)        (           \
 362            (x)==PIX_FMT_BGR32       \
 363         || (x)==PIX_FMT_BGR32_1     \
 364         || (x)==PIX_FMT_BGR24       \
 365         || (x)==PIX_FMT_BGR565      \
 366         || (x)==PIX_FMT_BGR555      \
 367         || (x)==PIX_FMT_BGR8        \
 368         || (x)==PIX_FMT_BGR4        \
 369         || (x)==PIX_FMT_BGR4_BYTE   \
 370         || (x)==PIX_FMT_MONOBLACK   \
 371         || (x)==PIX_FMT_MONOWHITE   \
 372     )
 373 #define isALPHA(x)      (           \
 374            (x)==PIX_FMT_BGR32       \
 375         || (x)==PIX_FMT_BGR32_1     \
 376         || (x)==PIX_FMT_RGB32       \
 377         || (x)==PIX_FMT_RGB32_1     \
 378         || (x)==PIX_FMT_YUVA420P    \
 379     )
 380
 381 static inline int fmt_depth(int fmt)
 382 {
 383     switch(fmt) {
 384         case PIX_FMT_RGB48BE:
 385         case PIX_FMT_RGB48LE:
 386             return 48;
 387         case PIX_FMT_BGRA:
 388         case PIX_FMT_ABGR:
 389         case PIX_FMT_RGBA:
 390         case PIX_FMT_ARGB:
 391             return 32;
 392         case PIX_FMT_BGR24:
 393         case PIX_FMT_RGB24:
 394             return 24;
 395         case PIX_FMT_BGR565:
 396         case PIX_FMT_RGB565:
 397         case PIX_FMT_GRAY16BE:
 398         case PIX_FMT_GRAY16LE:
 399             return 16;
 400         case PIX_FMT_BGR555:
 401         case PIX_FMT_RGB555:
 402             return 15;
 403         case PIX_FMT_BGR8:
 404         case PIX_FMT_RGB8:
 405             return 8;
 406         case PIX_FMT_BGR4:
 407         case PIX_FMT_RGB4:
 408         case PIX_FMT_BGR4_BYTE:
 409         case PIX_FMT_RGB4_BYTE:
 410             return 4;
 411         case PIX_FMT_MONOBLACK:
 412         case PIX_FMT_MONOWHITE:
 413             return 1;
 414         default:
 415             return 0;
 416     }
 417 }
 418
 419 extern const uint64_t ff_dither4[2];
 420 extern const uint64_t ff_dither8[2];
 421
 422 extern const AVClass sws_context_class;
 423
 424 #endif /* SWSCALE_SWSCALE_INTERNAL_H */