doxygen/4.0/output_8c_source.html

 /*

  * Copyright (C) 2001-2012 Michael Niedermayer <michaelni@gmx.at>

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 #include <math.h>

 #include <stdint.h>

 #include <stdio.h>

 #include <string.h>


 #include "libavutil/attributes.h"

 #include "libavutil/avutil.h"

 #include "libavutil/avassert.h"

 #include "libavutil/bswap.h"

 #include "libavutil/cpu.h"

 #include "libavutil/intreadwrite.h"

 #include "libavutil/mathematics.h"

 #include "libavutil/pixdesc.h"

 #include "config.h"

 #include "rgb2rgb.h"

 #include "swscale.h"

 #include "swscale_internal.h"


 /* 2x2 ordered-dither pattern (1,3 / 2,0) tiled across the 8 columns of each
  * row. Entries lie in 0..3; the third row repeats the first. */
 DECLARE_ALIGNED(8, const uint8_t, ff_dither_2x2_4)[][8] = {

 {  1,   3,   1,   3,   1,   3,   1,   3, },

 {  2,   0,   2,   0,   2,   0,   2,   0, },

 {  1,   3,   1,   3,   1,   3,   1,   3, },

 };


 /* 2x2 ordered-dither pattern (6,2 / 0,4) tiled across the 8 columns of each
  * row. Entries lie in 0..6; the third row repeats the first. */
 DECLARE_ALIGNED(8, const uint8_t, ff_dither_2x2_8)[][8] = {

 {  6,   2,   6,   2,   6,   2,   6,   2, },

 {  0,   4,   0,   4,   0,   4,   0,   4, },

 {  6,   2,   6,   2,   6,   2,   6,   2, },

 };


 /* 4x4 ordered-dither pattern with entries 0..15; each row holds the 4-entry
  * pattern twice. The fifth row repeats the first. */
 DECLARE_ALIGNED(8, const uint8_t, ff_dither_4x4_16)[][8] = {

 {  8,   4,  11,   7,   8,   4,  11,   7, },

 {  2,  14,   1,  13,   2,  14,   1,  13, },

 { 10,   6,   9,   5,  10,   6,   9,   5, },

 {  0,  12,   3,  15,   0,  12,   3,  15, },

 {  8,   4,  11,   7,   8,   4,  11,   7, },

 };


 /* 8x8 ordered-dither pattern with entries 0..31. A ninth row repeating the
  * first is appended. */
 DECLARE_ALIGNED(8, const uint8_t, ff_dither_8x8_32)[][8] = {

 { 17,   9,  23,  15,  16,   8,  22,  14, },

 {  5,  29,   3,  27,   4,  28,   2,  26, },

 { 21,  13,  19,  11,  20,  12,  18,  10, },

 {  0,  24,   6,  30,   1,  25,   7,  31, },

 { 16,   8,  22,  14,  17,   9,  23,  15, },

 {  4,  28,   2,  26,   5,  29,   3,  27, },

 { 20,  12,  18,  10,  21,  13,  19,  11, },

 {  1,  25,   7,  31,   0,  24,   6,  30, },

 { 17,   9,  23,  15,  16,   8,  22,  14, },

 };


 /* 8x8 ordered-dither pattern with entries 0..72. A ninth row repeating the
  * first is appended. */
 DECLARE_ALIGNED(8, const uint8_t, ff_dither_8x8_73)[][8] = {

 {  0,  55,  14,  68,   3,  58,  17,  72, },

 { 37,  18,  50,  32,  40,  22,  54,  35, },

 {  9,  64,   5,  59,  13,  67,   8,  63, },

 { 46,  27,  41,  23,  49,  31,  44,  26, },

 {  2,  57,  16,  71,   1,  56,  15,  70, },

 { 39,  21,  52,  34,  38,  19,  51,  33, },

 { 11,  66,   7,  62,  10,  65,   6,  60, },

 { 48,  30,  43,  25,  47,  29,  42,  24, },

 {  0,  55,  14,  68,   3,  58,  17,  72, },

 };


 /* 8x8 dither pattern used by the yuv2mono_* writers below, which pick the
  * row with (y & 7). Four variants are listed; because the first condition is
  * "#if 1", only the first table (entries 0..217) is ever compiled and the
  * #elif/#else tables are inactive alternatives. Every variant appends a
  * ninth row repeating its first. */
 #if 1

 DECLARE_ALIGNED(8, const uint8_t, ff_dither_8x8_220)[][8] = {

 {117,  62, 158, 103, 113,  58, 155, 100, },

 { 34, 199,  21, 186,  31, 196,  17, 182, },

 {144,  89, 131,  76, 141,  86, 127,  72, },

 {  0, 165,  41, 206,  10, 175,  52, 217, },

 {110,  55, 151,  96, 120,  65, 162, 107, },

 { 28, 193,  14, 179,  38, 203,  24, 189, },

 {138,  83, 124,  69, 148,  93, 134,  79, },

 {  7, 172,  48, 213,   3, 168,  45, 210, },

 {117,  62, 158, 103, 113,  58, 155, 100, },

 };

 #elif 1

 // tries to correct a gamma of 1.5

 DECLARE_ALIGNED(8, const uint8_t, ff_dither_8x8_220)[][8] = {

 {  0, 143,  18, 200,   2, 156,  25, 215, },

 { 78,  28, 125,  64,  89,  36, 138,  74, },

 { 10, 180,   3, 161,  16, 195,   8, 175, },

 {109,  51,  93,  38, 121,  60, 105,  47, },

 {  1, 152,  23, 210,   0, 147,  20, 205, },

 { 85,  33, 134,  71,  81,  30, 130,  67, },

 { 14, 190,   6, 171,  12, 185,   5, 166, },

 {117,  57, 101,  44, 113,  54,  97,  41, },

 {  0, 143,  18, 200,   2, 156,  25, 215, },

 };

 #elif 1

 // tries to correct a gamma of 2.0

 DECLARE_ALIGNED(8, const uint8_t, ff_dither_8x8_220)[][8] = {

 {  0, 124,   8, 193,   0, 140,  12, 213, },

 { 55,  14, 104,  42,  66,  19, 119,  52, },

 {  3, 168,   1, 145,   6, 187,   3, 162, },

 { 86,  31,  70,  21,  99,  39,  82,  28, },

 {  0, 134,  11, 206,   0, 129,   9, 200, },

 { 62,  17, 114,  48,  58,  16, 109,  45, },

 {  5, 181,   2, 157,   4, 175,   1, 151, },

 { 95,  36,  78,  26,  90,  34,  74,  24, },

 {  0, 124,   8, 193,   0, 140,  12, 213, },

 };

 #else

 // tries to correct a gamma of 2.5

 DECLARE_ALIGNED(8, const uint8_t, ff_dither_8x8_220)[][8] = {

 {  0, 107,   3, 187,   0, 125,   6, 212, },

 { 39,   7,  86,  28,  49,  11, 102,  36, },

 {  1, 158,   0, 131,   3, 180,   1, 151, },

 { 68,  19,  52,  12,  81,  25,  64,  17, },

 {  0, 119,   5, 203,   0, 113,   4, 195, },

 { 45,   9,  96,  33,  42,   8,  91,  30, },

 {  2, 172,   1, 144,   2, 165,   0, 137, },

 { 77,  23,  60,  15,  72,  21,  56,  14, },

 {  0, 107,   3, 187,   0, 125,   6, 212, },

 };

 #endif


 /*
  * Store one 16-bit sample at pos.
  *
  * val is shifted right by the caller's local `shift`, clipped with
  * av_clip_int16() or av_clip_uint16() (chosen by signedness = int / uint),
  * offset by bias, and written big- or little-endian according to the
  * caller's local `big_endian`.
  *
  * The body is wrapped in do { } while (0) and the arguments are parenthesized
  * so the macro expands to exactly one statement and is safe inside an
  * unbraced if/else.
  */
 #define output_pixel(pos, val, bias, signedness) \
     do { \
         if (big_endian) { \
             AV_WB16(pos, (bias) + av_clip_ ## signedness ## 16((val) >> shift)); \
         } else { \
             AV_WL16(pos, (bias) + av_clip_ ## signedness ## 16((val) >> shift)); \
         } \
     } while (0)


 /**
  * Write one 16-bit output line from a single (unfiltered) 32-bit source line.
  *
  * Each sample is rounded, shifted right by 3, clipped to the unsigned 16-bit
  * range and stored through output_pixel() in the requested byte order.
  *
  * @param src         dstW input samples
  * @param dest        dstW output samples
  * @param dstW        number of samples to write
  * @param big_endian  non-zero to store big-endian, zero for little-endian
  * @param output_bits must be 16 (asserted)
  */
 static av_always_inline void
 yuv2plane1_16_c_template(const int32_t *src, uint16_t *dest, int dstW,
                          int big_endian, int output_bits)
 {
     const int shift    = 3;                 /* also read by output_pixel() */
     const int rounding = 1 << (shift - 1);
     int x = 0;

     av_assert0(output_bits == 16);

     while (x < dstW) {
         int val = src[x] + rounding;
         output_pixel(&dest[x], val, 0, uint);
         x++;
     }
 }


 /**
  * Write one 16-bit output line as a weighted sum of filterSize 32-bit
  * source lines.
  *
  * @param filter      filterSize coefficients
  * @param filterSize  number of source lines / coefficients
  * @param src         filterSize pointers to source lines of dstW samples
  * @param dest        dstW output samples
  * @param dstW        number of samples to write
  * @param big_endian  non-zero to store big-endian, zero for little-endian
  * @param output_bits must be 16 (asserted)
  */
 static av_always_inline void
 yuv2planeX_16_c_template(const int16_t *filter, int filterSize,
                          const int32_t **src, uint16_t *dest, int dstW,
                          int big_endian, int output_bits)
 {
     const int shift = 15;                   /* also read by output_pixel() */
     int x;

     av_assert0(output_bits == 16);

     for (x = 0; x < dstW; x++) {
         /* The range of the sum is [0,0x7FFFFFFF], so 31 bits, but with
          * lanczos/spline filters (or anything with negative coefficients)
          * it can be slightly wider in both directions. To keep it inside
          * the signed range (assuming a reasonable filterSize) a constant
          * is subtracted up front; it is re-added after the shift as the
          * 0x8000 bias (0x40000000 >> 15). */
         int val = (1 << (shift - 1)) - 0x40000000;
         int tap;

         for (tap = 0; tap < filterSize; tap++)
             val += src[tap][x] * (unsigned)filter[tap];

         output_pixel(&dest[x], val, 0x8000, int);
     }
 }


 /**
  * Vertically filter the U and V planes and store them interleaved
  * (U at even, V at odd 16-bit positions) for P016 output.
  *
  * The source line pointers are declared int16_t but are read as int32_t
  * lines. Byte order is big-endian when c->dstFormat is AV_PIX_FMT_P016BE,
  * little-endian otherwise.
  *
  * @param c             scaler context (only dstFormat is read)
  * @param chrFilter     chrFilterSize coefficients
  * @param chrFilterSize number of chroma source lines
  * @param chrUSrc       U source lines
  * @param chrVSrc       V source lines
  * @param dest8         output buffer, written as 2 * chrDstW 16-bit values
  * @param chrDstW       number of chroma sample pairs to write
  */
 static void yuv2p016cX_c(SwsContext *c, const int16_t *chrFilter, int chrFilterSize,
                          const int16_t **chrUSrc, const int16_t **chrVSrc,
                          uint8_t *dest8, int chrDstW)
 {
     const int32_t **u_lines = (const int32_t **)chrUSrc;
     const int32_t **v_lines = (const int32_t **)chrVSrc;
     uint16_t *out = (uint16_t*)dest8;
     const int shift = 15;                   /* also read by output_pixel() */
     const int big_endian = c->dstFormat == AV_PIX_FMT_P016BE;
     /* Rounding term minus the overflow guard; see
      * yuv2planeX_16_c_template for details. */
     const int start = (1 << (shift - 1)) - 0x40000000;
     int x;

     for (x = 0; x < chrDstW; x++, out += 2) {
         int u = start;
         int v = start;
         int tap;

         for (tap = 0; tap < chrFilterSize; tap++) {
             u += u_lines[tap][x] * (unsigned)chrFilter[tap];
             v += v_lines[tap][x] * (unsigned)chrFilter[tap];
         }

         output_pixel(&out[0], u, 0x8000, int);
         output_pixel(&out[1], v, 0x8000, int);
     }
 }


 #undef output_pixel


 /*
  * Store one sample of output_bits significant bits at pos as a 16-bit word.
  *
  * val is shifted right by the caller's local `shift`, clipped to
  * [0, 2^output_bits - 1] with av_clip_uintp2() and written big- or
  * little-endian according to the caller's local `big_endian`.
  *
  * Wrapped in do { } while (0) so the macro is a single statement.
  */
 #define output_pixel(pos, val) \
     do { \
         if (big_endian) { \
             AV_WB16(pos, av_clip_uintp2((val) >> shift, output_bits)); \
         } else { \
             AV_WL16(pos, av_clip_uintp2((val) >> shift, output_bits)); \
         } \
     } while (0)


 /**
  * Write one output line of output_bits-deep samples (stored in 16-bit
  * words) from a single unfiltered 16-bit source line.
  *
  * Each sample is rounded and shifted right by (15 - output_bits), then
  * clipped and stored by output_pixel().
  *
  * @param src         dstW input samples
  * @param dest        dstW output words
  * @param dstW        number of samples to write
  * @param big_endian  non-zero to store big-endian, zero for little-endian
  * @param output_bits number of significant bits per output sample
  */
 static av_always_inline void
 yuv2plane1_10_c_template(const int16_t *src, uint16_t *dest, int dstW,
                          int big_endian, int output_bits)
 {
     const int shift = 15 - output_bits;     /* also read by output_pixel() */
     int x = 0;

     while (x < dstW) {
         int val = src[x] + (1 << (shift - 1));
         output_pixel(&dest[x], val);
         x++;
     }
 }


 /**
  * Write one output line of output_bits-deep samples (stored in 16-bit
  * words) as a weighted sum of filterSize 16-bit source lines.
  *
  * The sum starts from a rounding term and is shifted right by
  * (11 + 16 - output_bits) before being clipped and stored by output_pixel().
  *
  * @param filter      filterSize coefficients
  * @param filterSize  number of source lines / coefficients
  * @param src         filterSize pointers to source lines of dstW samples
  * @param dest        dstW output words
  * @param dstW        number of samples to write
  * @param big_endian  non-zero to store big-endian, zero for little-endian
  * @param output_bits number of significant bits per output sample
  */
 static av_always_inline void
 yuv2planeX_10_c_template(const int16_t *filter, int filterSize,
                          const int16_t **src, uint16_t *dest, int dstW,
                          int big_endian, int output_bits)
 {
     const int shift = 11 + 16 - output_bits; /* also read by output_pixel() */
     int x;

     for (x = 0; x < dstW; x++) {
         int val = 1 << (shift - 1);
         int tap = 0;

         while (tap < filterSize) {
             val += src[tap][x] * filter[tap];
             tap++;
         }

         output_pixel(&dest[x], val);
     }
 }


 #undef output_pixel


 /*
  * Generate the two static planar writers for one bit depth / byte order:
  *   yuv2plane1_<bits><BE_LE>_c  - single source line
  *   yuv2planeX_<bits><BE_LE>_c  - filtered sum of filterSize source lines
  * Each one casts src to typeX_t and dest to uint16_t * and forwards to
  * yuv2plane1_<template_size>_c_template / yuv2planeX_<template_size>_c_template
  * with is_be as the endianness flag and bits as output_bits.
  * The dither and offset parameters are accepted but not used.
  *
  * The instantiations below use the "10" templates with int16_t input for
  * 9, 10, 12 and 14 bits and the "16" templates with int32_t input for 16 bits.
  */
 #define yuv2NBPS(bits, BE_LE, is_be, template_size, typeX_t) \

 static void yuv2plane1_ ## bits ## BE_LE ## _c(const int16_t *src, \

                               uint8_t *dest, int dstW, \

                               const uint8_t *dither, int offset)\

 { \

     yuv2plane1_ ## template_size ## _c_template((const typeX_t *) src, \

                          (uint16_t *) dest, dstW, is_be, bits); \

 }\

 static void yuv2planeX_ ## bits ## BE_LE ## _c(const int16_t *filter, int filterSize, \

                               const int16_t **src, uint8_t *dest, int dstW, \

                               const uint8_t *dither, int offset)\

 { \

     yuv2planeX_## template_size ## _c_template(filter, \

                          filterSize, (const typeX_t **) src, \

                          (uint16_t *) dest, dstW, is_be, bits); \

 }

 yuv2NBPS( 9, BE, 1, 10, int16_t)

 yuv2NBPS( 9, LE, 0, 10, int16_t)

 yuv2NBPS(10, BE, 1, 10, int16_t)

 yuv2NBPS(10, LE, 0, 10, int16_t)

 yuv2NBPS(12, BE, 1, 10, int16_t)

 yuv2NBPS(12, LE, 0, 10, int16_t)

 yuv2NBPS(14, BE, 1, 10, int16_t)

 yuv2NBPS(14, LE, 0, 10, int16_t)

 yuv2NBPS(16, BE, 1, 16, int32_t)

 yuv2NBPS(16, LE, 0, 16, int32_t)


 /**
  * Write one 8-bit output line as a dithered, weighted sum of filterSize
  * source lines.
  *
  * For every sample the accumulator starts at dither[(x + offset) & 7] << 12,
  * the filtered sum is added, and the result is shifted right by 19 and
  * clipped to 0..255.
  *
  * @param filter     filterSize coefficients
  * @param filterSize number of source lines / coefficients
  * @param src        filterSize pointers to source lines of dstW samples
  * @param dest       dstW output bytes
  * @param dstW       number of samples to write
  * @param dither     8 dither values
  * @param offset     added to the sample index before indexing dither
  */
 static void yuv2planeX_8_c(const int16_t *filter, int filterSize,
                            const int16_t **src, uint8_t *dest, int dstW,
                            const uint8_t *dither, int offset)
 {
     int x;

     for (x = 0; x < dstW; x++) {
         int sum = dither[(x + offset) & 7] << 12;
         int tap = 0;

         while (tap < filterSize) {
             sum += src[tap][x] * filter[tap];
             tap++;
         }

         dest[x] = av_clip_uint8(sum >> 19);
     }
 }


 /**
  * Write one 8-bit output line from a single unfiltered source line.
  *
  * Each sample has dither[(x + offset) & 7] added, is shifted right by 7 and
  * clipped to 0..255.
  *
  * @param src    dstW input samples
  * @param dest   dstW output bytes
  * @param dstW   number of samples to write
  * @param dither 8 dither values
  * @param offset added to the sample index before indexing dither
  */
 static void yuv2plane1_8_c(const int16_t *src, uint8_t *dest, int dstW,
                            const uint8_t *dither, int offset)
 {
     int x = 0;

     while (x < dstW) {
         const int dithered = src[x] + dither[(x + offset) & 7];

         dest[x] = av_clip_uint8(dithered >> 7);
         x++;
     }
 }


 /**
  * Vertically filter the U and V planes into one interleaved 8-bit chroma
  * line.
  *
  * When c->dstFormat is AV_PIX_FMT_NV12 each pair is stored as U,V; for any
  * other destination format it is stored as V,U. U is dithered with
  * c->chrDither8[x & 7] and V with c->chrDither8[(x + 3) & 7].
  *
  * @param c             scaler context (dstFormat and chrDither8 are read)
  * @param chrFilter     chrFilterSize coefficients
  * @param chrFilterSize number of chroma source lines
  * @param chrUSrc       U source lines
  * @param chrVSrc       V source lines
  * @param dest          output buffer of 2 * chrDstW bytes
  * @param chrDstW       number of chroma sample pairs to write
  */
 static void yuv2nv12cX_c(SwsContext *c, const int16_t *chrFilter, int chrFilterSize,
                         const int16_t **chrUSrc, const int16_t **chrVSrc,
                         uint8_t *dest, int chrDstW)
 {
     const uint8_t *chrDither = c->chrDither8;
     const int u_first = c->dstFormat == AV_PIX_FMT_NV12;
     int x;

     for (x = 0; x < chrDstW; x++) {
         int u = chrDither[x & 7] << 12;
         int v = chrDither[(x + 3) & 7] << 12;
         int tap;

         for (tap = 0; tap < chrFilterSize; tap++) {
             u += chrUSrc[tap][x] * chrFilter[tap];
             v += chrVSrc[tap][x] * chrFilter[tap];
         }

         /* Only the store order differs between the two layouts. */
         if (u_first) {
             dest[2*x]     = av_clip_uint8(u >> 19);
             dest[2*x + 1] = av_clip_uint8(v >> 19);
         } else {
             dest[2*x]     = av_clip_uint8(v >> 19);
             dest[2*x + 1] = av_clip_uint8(u >> 19);
         }
     }
 }


 /*
  * Store one P010 sample at pos: val is shifted right by the caller's local
  * `shift`, clipped to 10 bits with av_clip_uintp2(), moved into the upper
  * 10 bits of the 16-bit word (<< 6) and written big- or little-endian
  * according to the caller's local `big_endian`.
  *
  * Wrapped in do { } while (0) so the macro is a single statement.
  */
 #define output_pixel(pos, val) \
     do { \
         if (big_endian) { \
             AV_WB16(pos, av_clip_uintp2((val) >> shift, 10) << 6); \
         } else { \
             AV_WL16(pos, av_clip_uintp2((val) >> shift, 10) << 6); \
         } \
     } while (0)


 /**
  * Write one P010 line from a single unfiltered source line.
  *
  * Each sample is rounded and shifted right by 5, then clipped to 10 bits
  * and stored in the upper bits of a 16-bit word by output_pixel().
  *
  * @param src        dstW input samples
  * @param dest       dstW output words
  * @param dstW       number of samples to write
  * @param big_endian non-zero to store big-endian, zero for little-endian
  */
 static void yuv2p010l1_c(const int16_t *src,
                          uint16_t *dest, int dstW,
                          int big_endian)
 {
     const int shift    = 5;                 /* also read by output_pixel() */
     const int rounding = 1 << (shift - 1);
     int x = 0;

     while (x < dstW) {
         int val = src[x] + rounding;
         output_pixel(&dest[x], val);
         x++;
     }
 }


 /**
  * Write one P010 line as a weighted sum of filterSize source lines.
  *
  * The sum starts from a rounding term and is shifted right by 17 before
  * output_pixel() clips it to 10 bits and stores it in the upper bits of a
  * 16-bit word.
  *
  * @param filter     filterSize coefficients
  * @param filterSize number of source lines / coefficients
  * @param src        filterSize pointers to source lines of dstW samples
  * @param dest       dstW output words
  * @param dstW       number of samples to write
  * @param big_endian non-zero to store big-endian, zero for little-endian
  */
 static void yuv2p010lX_c(const int16_t *filter, int filterSize,
                          const int16_t **src, uint16_t *dest, int dstW,
                          int big_endian)
 {
     const int shift    = 17;                /* also read by output_pixel() */
     const int rounding = 1 << (shift - 1);
     int x;

     for (x = 0; x < dstW; x++) {
         int val = rounding;
         int tap;

         for (tap = 0; tap < filterSize; tap++)
             val += src[tap][x] * filter[tap];

         output_pixel(&dest[x], val);
     }
 }


 /**
  * Vertically filter the U and V planes and store them interleaved
  * (U at even, V at odd 16-bit positions) for P010 output.
  *
  * Byte order is big-endian when c->dstFormat is AV_PIX_FMT_P010BE,
  * little-endian otherwise.
  *
  * @param c             scaler context (only dstFormat is read)
  * @param chrFilter     chrFilterSize coefficients
  * @param chrFilterSize number of chroma source lines
  * @param chrUSrc       U source lines
  * @param chrVSrc       V source lines
  * @param dest8         output buffer, written as 2 * chrDstW 16-bit values
  * @param chrDstW       number of chroma sample pairs to write
  */
 static void yuv2p010cX_c(SwsContext *c, const int16_t *chrFilter, int chrFilterSize,
                          const int16_t **chrUSrc, const int16_t **chrVSrc,
                          uint8_t *dest8, int chrDstW)
 {
     uint16_t *out = (uint16_t*)dest8;
     const int shift      = 17;              /* also read by output_pixel() */
     const int rounding   = 1 << (shift - 1);
     const int big_endian = c->dstFormat == AV_PIX_FMT_P010BE;
     int x;

     for (x = 0; x < chrDstW; x++, out += 2) {
         int u = rounding;
         int v = rounding;
         int tap;

         for (tap = 0; tap < chrFilterSize; tap++) {
             u += chrUSrc[tap][x] * chrFilter[tap];
             v += chrVSrc[tap][x] * chrFilter[tap];
         }

         output_pixel(&out[0], u);
         output_pixel(&out[1], v);
     }
 }


 /* Little-endian single-line P010 writer: forwards to yuv2p010l1_c() with
  * big_endian = 0 and dest viewed as 16-bit words. dither and offset are
  * accepted but not used. */
 static void yuv2p010l1_LE_c(const int16_t *src,

                             uint8_t *dest, int dstW,

                             const uint8_t *dither, int offset)

 {

     yuv2p010l1_c(src, (uint16_t*)dest, dstW, 0);

 }


 /* Big-endian single-line P010 writer: forwards to yuv2p010l1_c() with
  * big_endian = 1 and dest viewed as 16-bit words. dither and offset are
  * accepted but not used. */
 static void yuv2p010l1_BE_c(const int16_t *src,

                             uint8_t *dest, int dstW,

                             const uint8_t *dither, int offset)

 {

     yuv2p010l1_c(src, (uint16_t*)dest, dstW, 1);

 }


 /* Little-endian filtered P010 writer: forwards to yuv2p010lX_c() with
  * big_endian = 0 and dest viewed as 16-bit words. dither and offset are
  * accepted but not used. */
 static void yuv2p010lX_LE_c(const int16_t *filter, int filterSize,

                             const int16_t **src, uint8_t *dest, int dstW,

                             const uint8_t *dither, int offset)

 {

     yuv2p010lX_c(filter, filterSize, src, (uint16_t*)dest, dstW, 0);

 }


 /* Big-endian filtered P010 writer: forwards to yuv2p010lX_c() with
  * big_endian = 1 and dest viewed as 16-bit words. dither and offset are
  * accepted but not used. */
 static void yuv2p010lX_BE_c(const int16_t *filter, int filterSize,

                             const int16_t **src, uint8_t *dest, int dstW,

                             const uint8_t *dither, int offset)

 {

     yuv2p010lX_c(filter, filterSize, src, (uint16_t*)dest, dstW, 1);

 }


 #undef output_pixel


 /*
  * Shift acc left by one and set its new low bit when val >= 234.
  *
  * Wrapped in do { } while (0): the previous two-statement form would run the
  * second statement unconditionally when used as the body of an unbraced if.
  */
 #define accumulate_bit(acc, val) \
     do { \
         (acc) <<= 1; \
         (acc) |= (val) >= 234; \
     } while (0)

 /*
  * Store the accumulated bits into pos: as-is when the caller's local
  * `target` is AV_PIX_FMT_MONOBLACK, bit-inverted otherwise.
  *
  * pos is evaluated exactly once (callers pass *dest++).
  * Wrapped in do { } while (0) so the macro is a single statement and can be
  * the body of an unbraced if/else.
  */
 #define output_pixel(pos, acc) \
     do { \
         if (target == AV_PIX_FMT_MONOBLACK) { \
             pos = (acc); \
         } else { \
             pos = ~(acc); \
         } \
     } while (0)


 /**
  * Vertically filter luma and emit 1 bit-per-pixel output; the target
  * argument selects the polarity inside output_pixel().
  *
  * Two pixels are produced per loop iteration. Each luma value is the
  * filtered sum plus a 1 << 18 rounding term, shifted right by 19, and
  * clipped to 0..255 when bit 8 of either value is set. The bit decision is
  * made either by error diffusion (c->dither == SWS_DITHER_ED, with state in
  * c->dither_error[0]) or by adding the ff_dither_8x8_220 row selected by
  * (y & 7) and thresholding in accumulate_bit(). One byte is written after
  * every 8 pixels.
  *
  * The chroma filter/source arguments and alpSrc are not used.
  */
 static av_always_inline void

 yuv2mono_X_c_template(SwsContext *c, const int16_t *lumFilter,

                       const int16_t **lumSrc, int lumFilterSize,

                       const int16_t *chrFilter, const int16_t **chrUSrc,

                       const int16_t **chrVSrc, int chrFilterSize,

                       const int16_t **alpSrc, uint8_t *dest, int dstW,

                       int y, enum AVPixelFormat target)

 {

     const uint8_t * const d128 = ff_dither_8x8_220[y&7];

     int i;

     /* unsigned: acc is never reset, so it must be allowed to wrap */
     unsigned acc = 0;

     int err = 0;


     for (i = 0; i < dstW; i += 2) {

         int j;

         int Y1 = 1 << 18;

         int Y2 = 1 << 18;


         for (j = 0; j < lumFilterSize; j++) {

             Y1 += lumSrc[j][i]   * lumFilter[j];

             Y2 += lumSrc[j][i+1] * lumFilter[j];

         }

         Y1 >>= 19;

         Y2 >>= 19;

         if ((Y1 | Y2) & 0x100) {

             Y1 = av_clip_uint8(Y1);

             Y2 = av_clip_uint8(Y2);

         }

         if (c->dither == SWS_DITHER_ED) {

             /* Add the weighted error: 7x the previous pixel of this line plus
              * 1x/5x/3x three stored dither_error entries, rounded, / 16. */
             Y1 += (7*err + 1*c->dither_error[0][i] + 5*c->dither_error[0][i+1] + 3*c->dither_error[0][i+2] + 8 - 256)>>4;

             c->dither_error[0][i] = err;

             acc = 2*acc + (Y1 >= 128);

             /* a set bit removes 220 from the value carried forward as error */
             Y1 -= 220*(acc&1);


             err = Y2 + ((7*Y1 + 1*c->dither_error[0][i+1] + 5*c->dither_error[0][i+2] + 3*c->dither_error[0][i+3] + 8 - 256)>>4);

             c->dither_error[0][i+1] = Y1;

             acc = 2*acc + (err >= 128);

             err -= 220*(acc&1);

         } else {

             accumulate_bit(acc, Y1 + d128[(i + 0) & 7]);

             accumulate_bit(acc, Y2 + d128[(i + 1) & 7]);

         }

         /* 8 pixels accumulated: emit one byte */
         if ((i & 7) == 6) {

             output_pixel(*dest++, acc);

         }

     }

     /* executed for both dither modes */
     c->dither_error[0][i] = err;


     /* NOTE(review): the trailing partial byte is written with its bits in the
      * low positions of acc (not shifted up to the MSB side) - confirm that
      * this is what consumers of the last byte expect. */
     if (i & 6) {

         output_pixel(*dest, acc);

     }

 }


 /**
  * Blend two luma lines and emit 1 bit-per-pixel output; the target argument
  * selects the polarity inside output_pixel().
  *
  * Each luma value is (buf[0] * (4096 - yalpha) + buf[1] * yalpha) >> 19.
  *
  * - c->dither == SWS_DITHER_ED: error diffusion, two pixels per iteration,
  *   with state kept in c->dither_error[0]; a byte is written after every
  *   8 pixels.
  * - otherwise: 8 pixels per iteration, each offset by the
  *   ff_dither_8x8_220 row selected by (y & 7) and thresholded in
  *   accumulate_bit().
  *
  * The bit accumulator of the error-diffusion path is never reset between
  * bytes, so it is unsigned: a signed accumulator overflows (undefined
  * behavior) once enough pixels have been shifted in. Only its low 8 bits
  * reach the output byte.
  *
  * @param c       scaler context (dither, dither_error[0])
  * @param buf     the two luma lines to blend
  * @param ubuf    unused
  * @param vbuf    unused
  * @param abuf    unused
  * @param dest    output bytes, 8 pixels each
  * @param dstW    number of pixels
  * @param yalpha  weight of buf[1], 0..4096
  * @param uvalpha unused
  * @param y       output line number, selects the dither row
  * @param target  output pixel format, read by output_pixel()
  */
 static av_always_inline void
 yuv2mono_2_c_template(SwsContext *c, const int16_t *buf[2],
                       const int16_t *ubuf[2], const int16_t *vbuf[2],
                       const int16_t *abuf[2], uint8_t *dest, int dstW,
                       int yalpha, int uvalpha, int y,
                       enum AVPixelFormat target)
 {
     const int16_t *buf0  = buf[0],  *buf1  = buf[1];
     const uint8_t * const d128 = ff_dither_8x8_220[y & 7];
     int  yalpha1 = 4096 - yalpha;
     int i;
     av_assert2(yalpha  <= 4096U);

     if (c->dither == SWS_DITHER_ED) {
         int err = 0;
         unsigned acc = 0;   /* wraps instead of overflowing */

         for (i = 0; i < dstW; i += 2) {
             int Y;

             Y = (buf0[i + 0] * yalpha1 + buf1[i + 0] * yalpha) >> 19;
             Y += (7*err + 1*c->dither_error[0][i] + 5*c->dither_error[0][i+1] + 3*c->dither_error[0][i+2] + 8 - 256)>>4;
             c->dither_error[0][i] = err;
             acc = 2*acc + (Y >= 128);
             Y -= 220*(int)(acc&1);

             err = (buf0[i + 1] * yalpha1 + buf1[i + 1] * yalpha) >> 19;
             err += (7*Y + 1*c->dither_error[0][i+1] + 5*c->dither_error[0][i+2] + 3*c->dither_error[0][i+3] + 8 - 256)>>4;
             c->dither_error[0][i+1] = Y;
             acc = 2*acc + (err >= 128);
             err -= 220*(int)(acc&1);

             /* 8 pixels accumulated: emit one byte */
             if ((i & 7) == 6) {
                 output_pixel(*dest++, acc);
             }
         }
         c->dither_error[0][i] = err;
     } else {
         for (i = 0; i < dstW; i += 8) {
             unsigned acc = 0;
             int k;

             for (k = 0; k < 8; k++) {
                 int Y = (buf0[i + k] * yalpha1 + buf1[i + k] * yalpha) >> 19;
                 accumulate_bit(acc, Y + d128[k]);
             }

             output_pixel(*dest++, acc);
         }
     }
 }


 /**
  * Convert a single luma line to 1 bit-per-pixel output; the target argument
  * selects the polarity inside output_pixel().
  *
  * Each luma value is (buf0[x] + 64) >> 7.
  *
  * - c->dither == SWS_DITHER_ED: error diffusion, two pixels per iteration,
  *   with state kept in c->dither_error[0]; a byte is written after every
  *   8 pixels.
  * - otherwise: 8 pixels per iteration, each offset by the
  *   ff_dither_8x8_220 row selected by (y & 7) and thresholded in
  *   accumulate_bit().
  *
  * The bit accumulator of the error-diffusion path is never reset between
  * bytes, so it is unsigned: a signed accumulator overflows (undefined
  * behavior) once enough pixels have been shifted in. Only its low 8 bits
  * reach the output byte.
  *
  * @param c       scaler context (dither, dither_error[0])
  * @param buf0    luma line
  * @param ubuf    unused
  * @param vbuf    unused
  * @param abuf0   unused
  * @param dest    output bytes, 8 pixels each
  * @param dstW    number of pixels
  * @param uvalpha unused
  * @param y       output line number, selects the dither row
  * @param target  output pixel format, read by output_pixel()
  */
 static av_always_inline void
 yuv2mono_1_c_template(SwsContext *c, const int16_t *buf0,
                       const int16_t *ubuf[2], const int16_t *vbuf[2],
                       const int16_t *abuf0, uint8_t *dest, int dstW,
                       int uvalpha, int y, enum AVPixelFormat target)
 {
     const uint8_t * const d128 = ff_dither_8x8_220[y & 7];
     int i;

     if (c->dither == SWS_DITHER_ED) {
         int err = 0;
         unsigned acc = 0;   /* wraps instead of overflowing */

         for (i = 0; i < dstW; i += 2) {
             int Y;

             Y = ((buf0[i + 0] + 64) >> 7);
             Y += (7*err + 1*c->dither_error[0][i] + 5*c->dither_error[0][i+1] + 3*c->dither_error[0][i+2] + 8 - 256)>>4;
             c->dither_error[0][i] = err;
             acc = 2*acc + (Y >= 128);
             Y -= 220*(int)(acc&1);

             err = ((buf0[i + 1] + 64) >> 7);
             err += (7*Y + 1*c->dither_error[0][i+1] + 5*c->dither_error[0][i+2] + 3*c->dither_error[0][i+3] + 8 - 256)>>4;
             c->dither_error[0][i+1] = Y;
             acc = 2*acc + (err >= 128);
             err -= 220*(int)(acc&1);

             /* 8 pixels accumulated: emit one byte */
             if ((i & 7) == 6) {
                 output_pixel(*dest++, acc);
             }
         }
         c->dither_error[0][i] = err;
     } else {
         for (i = 0; i < dstW; i += 8) {
             unsigned acc = 0;
             int k;

             for (k = 0; k < 8; k++) {
                 accumulate_bit(acc, ((buf0[i + k] + 64) >> 7) + d128[k]);
             }

             output_pixel(*dest++, acc);
         }
     }
 }


 #undef output_pixel

 #undef accumulate_bit


 /*
  * Generate the three static packed-output entry points for one format:
  *   <name><ext>_X_c - vertically filtered input
  *   <name><ext>_2_c - blend of two input lines
  *   <name><ext>_1_c - single input line
  * Each forwards all of its arguments to the matching
  * <name><base>_{X,2,1}_c_template and appends fmt as the target pixel format.
  */
 #define YUV2PACKEDWRAPPER(name, base, ext, fmt) \

 static void name ## ext ## _X_c(SwsContext *c, const int16_t *lumFilter, \

                                 const int16_t **lumSrc, int lumFilterSize, \

                                 const int16_t *chrFilter, const int16_t **chrUSrc, \

                                 const int16_t **chrVSrc, int chrFilterSize, \

                                 const int16_t **alpSrc, uint8_t *dest, int dstW, \

                                 int y) \

 { \

     name ## base ## _X_c_template(c, lumFilter, lumSrc, lumFilterSize, \

                                   chrFilter, chrUSrc, chrVSrc, chrFilterSize, \

                                   alpSrc, dest, dstW, y, fmt); \

 } \

  \

 static void name ## ext ## _2_c(SwsContext *c, const int16_t *buf[2], \

                                 const int16_t *ubuf[2], const int16_t *vbuf[2], \

                                 const int16_t *abuf[2], uint8_t *dest, int dstW, \

                                 int yalpha, int uvalpha, int y) \

 { \

     name ## base ## _2_c_template(c, buf, ubuf, vbuf, abuf, \

                                   dest, dstW, yalpha, uvalpha, y, fmt); \

 } \

  \

 static void name ## ext ## _1_c(SwsContext *c, const int16_t *buf0, \

                                 const int16_t *ubuf[2], const int16_t *vbuf[2], \

                                 const int16_t *abuf0, uint8_t *dest, int dstW, \

                                 int uvalpha, int y) \

 { \

     name ## base ## _1_c_template(c, buf0, ubuf, vbuf, \

                                   abuf0, dest, dstW, uvalpha, \

                                   y, fmt); \

 }


 /* yuv2monowhite_{X,2,1}_c and yuv2monoblack_{X,2,1}_c; base is empty, so both
  * use the yuv2mono_*_c_template functions. */
 YUV2PACKEDWRAPPER(yuv2mono,, white, AV_PIX_FMT_MONOWHITE)

 YUV2PACKEDWRAPPER(yuv2mono,, black, AV_PIX_FMT_MONOBLACK)


 /*
  * Store one packed 4:2:2 group (two luma samples, one U, one V) into the
  * caller's local `dest` starting at byte offset pos. The byte order depends
  * on the caller's local `target`:
  *   AV_PIX_FMT_YUYV422: Y1 U  Y2 V
  *   AV_PIX_FMT_YVYU422: Y1 V  Y2 U
  *   anything else (AV_PIX_FMT_UYVY422): U  Y1 V  Y2
  *
  * pos is parenthesized and the body is wrapped in do { } while (0) so the
  * macro is a single statement and safe with expression arguments.
  */
 #define output_pixels(pos, Y1, U, Y2, V) \
     do { \
         if (target == AV_PIX_FMT_YUYV422) { \
             dest[(pos) + 0] = Y1; \
             dest[(pos) + 1] = U;  \
             dest[(pos) + 2] = Y2; \
             dest[(pos) + 3] = V;  \
         } else if (target == AV_PIX_FMT_YVYU422) { \
             dest[(pos) + 0] = Y1; \
             dest[(pos) + 1] = V;  \
             dest[(pos) + 2] = Y2; \
             dest[(pos) + 3] = U;  \
         } else { /* AV_PIX_FMT_UYVY422 */ \
             dest[(pos) + 0] = U;  \
             dest[(pos) + 1] = Y1; \
             dest[(pos) + 2] = V;  \
             dest[(pos) + 3] = Y2; \
         } \
     } while (0)


 /**
  * Vertically filter luma and chroma and write packed 8-bit 4:2:2 output.
  *
  * (dstW + 1) >> 1 groups are written; each group takes two luma samples and
  * one U/V sample. Every sum starts from a 1 << 18 rounding term and is
  * shifted right by 19; the four values are clipped to 0..255 when bit 8 of
  * any of them is set. The byte layout is selected by target inside
  * output_pixels().
  *
  * c, alpSrc and y are not used.
  */
 static av_always_inline void
 yuv2422_X_c_template(SwsContext *c, const int16_t *lumFilter,
                      const int16_t **lumSrc, int lumFilterSize,
                      const int16_t *chrFilter, const int16_t **chrUSrc,
                      const int16_t **chrVSrc, int chrFilterSize,
                      const int16_t **alpSrc, uint8_t *dest, int dstW,
                      int y, enum AVPixelFormat target)
 {
     const int pairs = (dstW + 1) >> 1;
     int n;

     for (n = 0; n < pairs; n++) {
         int Y1 = 1 << 18, Y2 = 1 << 18;
         int U  = 1 << 18, V  = 1 << 18;
         int tap;

         for (tap = 0; tap < lumFilterSize; tap++) {
             Y1 += lumSrc[tap][2 * n]     * lumFilter[tap];
             Y2 += lumSrc[tap][2 * n + 1] * lumFilter[tap];
         }
         for (tap = 0; tap < chrFilterSize; tap++) {
             U += chrUSrc[tap][n] * chrFilter[tap];
             V += chrVSrc[tap][n] * chrFilter[tap];
         }

         Y1 >>= 19;
         Y2 >>= 19;
         U  >>= 19;
         V  >>= 19;

         /* bit 8 set in any value means at least one is outside 0..255 */
         if ((Y1 | Y2 | U | V) & 0x100) {
             Y1 = av_clip_uint8(Y1);
             Y2 = av_clip_uint8(Y2);
             U  = av_clip_uint8(U);
             V  = av_clip_uint8(V);
         }

         output_pixels(4 * n, Y1, U, Y2, V);
     }
 }


 /**
  * Blend two input lines and write packed 8-bit 4:2:2 output.
  *
  * Luma is (buf[0] * (4096 - yalpha) + buf[1] * yalpha) >> 19 and chroma is
  * blended the same way with uvalpha. (dstW + 1) >> 1 groups are written;
  * the four values of a group are clipped to 0..255 when bit 8 of any of
  * them is set. The byte layout is selected by target inside
  * output_pixels().
  *
  * c, abuf and y are not used.
  */
 static av_always_inline void
 yuv2422_2_c_template(SwsContext *c, const int16_t *buf[2],
                      const int16_t *ubuf[2], const int16_t *vbuf[2],
                      const int16_t *abuf[2], uint8_t *dest, int dstW,
                      int yalpha, int uvalpha, int y,
                      enum AVPixelFormat target)
 {
     const int16_t *luma0 = buf[0],  *luma1 = buf[1];
     const int16_t *u0    = ubuf[0], *u1    = ubuf[1];
     const int16_t *v0    = vbuf[0], *v1    = vbuf[1];
     const int yalpha1  = 4096 - yalpha;
     const int uvalpha1 = 4096 - uvalpha;
     const int pairs    = (dstW + 1) >> 1;
     int n;

     av_assert2(yalpha  <= 4096U);
     av_assert2(uvalpha <= 4096U);

     for (n = 0; n < pairs; n++) {
         const int left  = 2 * n;
         const int right = 2 * n + 1;
         int Y1 = (luma0[left]  * yalpha1  + luma1[left]  * yalpha)  >> 19;
         int Y2 = (luma0[right] * yalpha1  + luma1[right] * yalpha)  >> 19;
         int U  = (u0[n]        * uvalpha1 + u1[n]        * uvalpha) >> 19;
         int V  = (v0[n]        * uvalpha1 + v1[n]        * uvalpha) >> 19;

         /* bit 8 set in any value means at least one is outside 0..255 */
         if ((Y1 | Y2 | U | V) & 0x100) {
             Y1 = av_clip_uint8(Y1);
             Y2 = av_clip_uint8(Y2);
             U  = av_clip_uint8(U);
             V  = av_clip_uint8(V);
         }

         output_pixels(4 * n, Y1, U, Y2, V);
     }
 }


 /**
  * Convert a single luma line to packed 8-bit 4:2:2 output.
  *
  * Luma is (buf0[x] + 64) >> 7. Chroma comes from ubuf[0]/vbuf[0] alone
  * ((v + 64) >> 7) when uvalpha < 2048, otherwise from the sum of both
  * chroma lines ((v0 + v1 + 128) >> 8). (dstW + 1) >> 1 groups are written
  * and every value is clipped to 0..255. The byte layout is selected by
  * target inside output_pixels().
  *
  * Each value is clipped exactly once: the earlier conditional clip was
  * always followed by an unconditional one and was therefore redundant.
  *
  * c, abuf0 and y are not used.
  */
 static av_always_inline void
 yuv2422_1_c_template(SwsContext *c, const int16_t *buf0,
                      const int16_t *ubuf[2], const int16_t *vbuf[2],
                      const int16_t *abuf0, uint8_t *dest, int dstW,
                      int uvalpha, int y, enum AVPixelFormat target)
 {
     const int16_t *ubuf0 = ubuf[0], *vbuf0 = vbuf[0];
     int i;

     if (uvalpha < 2048) {
         for (i = 0; i < ((dstW + 1) >> 1); i++) {
             int Y1 = av_clip_uint8((buf0[i * 2    ] + 64) >> 7);
             int Y2 = av_clip_uint8((buf0[i * 2 + 1] + 64) >> 7);
             int U  = av_clip_uint8((ubuf0[i]        + 64) >> 7);
             int V  = av_clip_uint8((vbuf0[i]        + 64) >> 7);

             output_pixels(i * 4, Y1, U, Y2, V);
         }
     } else {
         const int16_t *ubuf1 = ubuf[1], *vbuf1 = vbuf[1];

         for (i = 0; i < ((dstW + 1) >> 1); i++) {
             int Y1 = av_clip_uint8((buf0[i * 2    ]      +  64) >> 7);
             int Y2 = av_clip_uint8((buf0[i * 2 + 1]      +  64) >> 7);
             int U  = av_clip_uint8((ubuf0[i] + ubuf1[i]  + 128) >> 8);
             int V  = av_clip_uint8((vbuf0[i] + vbuf1[i]  + 128) >> 8);

             output_pixels(i * 4, Y1, U, Y2, V);
         }
     }
 }


 #undef output_pixels


 /* Instantiate the _X_c, _2_c and _1_c packed 4:2:2 writers for each of the
  * three byte layouts; all of them use the yuv2422_*_c_template functions. */
 YUV2PACKEDWRAPPER(yuv2, 422, yuyv422, AV_PIX_FMT_YUYV422)

 YUV2PACKEDWRAPPER(yuv2, 422, yvyu422, AV_PIX_FMT_YVYU422)

 YUV2PACKEDWRAPPER(yuv2, 422, uyvy422, AV_PIX_FMT_UYVY422)


 /* Channel selectors for the 16-bit-per-component RGB writers. They read the
  * caller's locals `target`, `R` and `B`: for the RGB48/RGBA64 targets R_B is
  * R and B_R is B; for every other target the two are swapped. */
 #define R_B ((target == AV_PIX_FMT_RGB48LE || target == AV_PIX_FMT_RGB48BE || target == AV_PIX_FMT_RGBA64LE || target == AV_PIX_FMT_RGBA64BE) ? R : B)

 #define B_R ((target == AV_PIX_FMT_RGB48LE || target == AV_PIX_FMT_RGB48BE || target == AV_PIX_FMT_RGBA64LE || target == AV_PIX_FMT_RGBA64BE) ? B : R)

 /*
  * Store the 16-bit value val at pos, big-endian when isBE(target) is true
  * for the caller's local `target`, little-endian otherwise.
  *
  * Wrapped in do { } while (0) so the macro is a single statement and can be
  * the body of an unbraced if/else.
  */
 #define output_pixel(pos, val) \
     do { \
         if (isBE(target)) { \
             AV_WB16(pos, val); \
         } else { \
             AV_WL16(pos, val); \
         } \
     } while (0)


 /**
  * Vertically filter 32-bit luma/chroma (and optionally alpha) lines, convert
  * to RGB with the coefficients stored in the context and write 16-bit
  * components.
  *
  * (dstW + 1) >> 1 iterations each produce two pixels that share one U/V
  * sample. With eightbytes set, 4 components per pixel are written (colour
  * plus alpha, 8 words per iteration); otherwise 3 components per pixel
  * (6 words per iteration). The first/third component order comes from the
  * R_B / B_R macros and the byte order from output_pixel(), both driven by
  * target.
  *
  * When hasAlpha is zero alpSrc is not read and alpha stays at
  * 0xffff << 14, i.e. 0xffff after the final >> 14.
  *
  * @param c          scaler context (yuv2rgb_* offset and coefficients)
  * @param lumFilter  lumFilterSize luma coefficients, also applied to alpha
  * @param chrFilter  chrFilterSize chroma coefficients
  * @param dest       output words
  * @param y          unused
  */
 static av_always_inline void
 yuv2rgba64_X_c_template(SwsContext *c, const int16_t *lumFilter,
                        const int32_t **lumSrc, int lumFilterSize,
                        const int16_t *chrFilter, const int32_t **chrUSrc,
                        const int32_t **chrVSrc, int chrFilterSize,
                        const int32_t **alpSrc, uint16_t *dest, int dstW,
                        int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
 {
     const int pairs = (dstW + 1) >> 1;
     int A1 = 0xffff<<14, A2 = 0xffff<<14;
     int n;

     for (n = 0; n < pairs; n++) {
         const int left  = 2 * n;
         const int right = 2 * n + 1;
         /* The sums start from a negative constant so that they stay inside
          * the signed range; it is compensated for after the shift below. */
         int Y1 = -0x40000000;
         int Y2 = -0x40000000;
         int U  = -(128 << 23);
         int V  = -(128 << 23);
         int R, G, B;
         int tap;

         for (tap = 0; tap < lumFilterSize; tap++) {
             Y1 += lumSrc[tap][left]  * (unsigned)lumFilter[tap];
             Y2 += lumSrc[tap][right] * (unsigned)lumFilter[tap];
         }
         for (tap = 0; tap < chrFilterSize; tap++) {
             U += chrUSrc[tap][n] * (unsigned)chrFilter[tap];
             V += chrVSrc[tap][n] * (unsigned)chrFilter[tap];
         }

         if (hasAlpha) {
             A1 = -0x40000000;
             A2 = -0x40000000;
             for (tap = 0; tap < lumFilterSize; tap++) {
                 A1 += alpSrc[tap][left]  * (unsigned)lumFilter[tap];
                 A2 += alpSrc[tap][right] * (unsigned)lumFilter[tap];
             }
             A1 = (A1 >> 1) + 0x20002000;
             A2 = (A2 >> 1) + 0x20002000;
         }

         /* 8 bits: 12+15=27; 16 bits: 12+19=31 */
         Y1 = (Y1 >> 14) + 0x10000;  /* 0x10000 == 0x40000000 >> 14 */
         Y2 = (Y2 >> 14) + 0x10000;
         U >>= 14;
         V >>= 14;

         /* 8 bits: 27 -> 17 bits, 16 bits: 31 - 14 = 17 bits */
         Y1 -= c->yuv2rgb_y_offset;
         Y2 -= c->yuv2rgb_y_offset;
         Y1 *= c->yuv2rgb_y_coeff;
         Y2 *= c->yuv2rgb_y_coeff;
         Y1 += 1 << 13;              /* rounding for the final >> 14 */
         Y2 += 1 << 13;
         /* 8 bits: 17 + 13 bits = 30 bits, 16 bits: 17 + 13 bits = 30 bits */

         R = V * c->yuv2rgb_v2r_coeff;
         G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
         B =                            U * c->yuv2rgb_u2b_coeff;

         /* 8 bits: 30 - 22 = 8 bits, 16 bits: 30 bits - 14 = 16 bits */
         output_pixel(&dest[0], av_clip_uintp2(R_B + Y1, 30) >> 14);
         output_pixel(&dest[1], av_clip_uintp2(  G + Y1, 30) >> 14);
         output_pixel(&dest[2], av_clip_uintp2(B_R + Y1, 30) >> 14);
         if (eightbytes) {
             output_pixel(&dest[3], av_clip_uintp2(A1      , 30) >> 14);
             output_pixel(&dest[4], av_clip_uintp2(R_B + Y2, 30) >> 14);
             output_pixel(&dest[5], av_clip_uintp2(  G + Y2, 30) >> 14);
             output_pixel(&dest[6], av_clip_uintp2(B_R + Y2, 30) >> 14);
             output_pixel(&dest[7], av_clip_uintp2(A2      , 30) >> 14);
             dest += 8;
         } else {
             output_pixel(&dest[3], av_clip_uintp2(R_B + Y2, 30) >> 14);
             output_pixel(&dest[4], av_clip_uintp2(  G + Y2, 30) >> 14);
             output_pixel(&dest[5], av_clip_uintp2(B_R + Y2, 30) >> 14);
             dest += 6;
         }
     }
 }


 /*
  * Blend two vertically adjacent source lines and convert the result to
  * packed RGB with 16 bits per component, two output pixels per iteration.
  *
  * buf/ubuf/vbuf/abuf each hold two lines: line 0 is weighted by
  * (4096 - alpha) and line 1 by alpha, with yalpha used for luma and alpha
  * samples and uvalpha for chroma. Each pixel pair shares one U/V sample.
  * abuf is dereferenced only when hasAlpha is non-zero; otherwise A1/A2 keep
  * their initial value 0xffff << 14. When eightbytes is non-zero every pixel
  * occupies four uint16_t components (alpha last), otherwise three.
  * The y argument is not referenced directly in this function.
  */
 static av_always_inline void
 yuv2rgba64_2_c_template(SwsContext *c, const int32_t *buf[2],
                        const int32_t *ubuf[2], const int32_t *vbuf[2],
                        const int32_t *abuf[2], uint16_t *dest, int dstW,
                        int yalpha, int uvalpha, int y,
                        enum AVPixelFormat target, int hasAlpha, int eightbytes)
 {
     const int32_t *buf0  = buf[0];
     const int32_t *buf1  = buf[1];
     const int32_t *ubuf0 = ubuf[0];
     const int32_t *ubuf1 = ubuf[1];
     const int32_t *vbuf0 = vbuf[0];
     const int32_t *vbuf1 = vbuf[1];
     const int32_t *abuf0 = NULL;
     const int32_t *abuf1 = NULL;
     const int  yalpha1 = 4096 - yalpha;
     const int uvalpha1 = 4096 - uvalpha;
     /* uint16_t components written per output pixel */
     const int comps = eightbytes ? 4 : 3;
     const int pairs = (dstW + 1) >> 1;
     int A1 = 0xffff<<14, A2 = 0xffff<<14;
     int i;

     if (hasAlpha) {
         abuf0 = abuf[0];
         abuf1 = abuf[1];
     }

     av_assert2(yalpha  <= 4096U);
     av_assert2(uvalpha <= 4096U);

     for (i = 0; i < pairs; i++) {
         const int left  = i * 2;
         const int right = i * 2 + 1;
         int Y1 = (buf0[left]  * yalpha1  + buf1[left]  * yalpha) >> 14;
         int Y2 = (buf0[right] * yalpha1  + buf1[right] * yalpha) >> 14;
         int U  = (ubuf0[i]    * uvalpha1 + ubuf1[i]    * uvalpha - (128 << 23)) >> 14;
         int V  = (vbuf0[i]    * uvalpha1 + vbuf1[i]    * uvalpha - (128 << 23)) >> 14;
         int R, G, B;

         /* luma: remove the offset, apply the gain, add the rounding term
          * for the final >> 14 */
         Y1 -= c->yuv2rgb_y_offset;
         Y1 *= c->yuv2rgb_y_coeff;
         Y1 += 1 << 13;

         Y2 -= c->yuv2rgb_y_offset;
         Y2 *= c->yuv2rgb_y_coeff;
         Y2 += 1 << 13;

         /* chroma contributions, shared by both pixels of the pair */
         B =                            U * c->yuv2rgb_u2b_coeff;
         G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
         R = V * c->yuv2rgb_v2r_coeff;

         if (hasAlpha) {
             A1 = (abuf0[left]  * yalpha1 + abuf1[left]  * yalpha) >> 1;
             A2 = (abuf0[right] * yalpha1 + abuf1[right] * yalpha) >> 1;

             A1 += 1 << 13;
             A2 += 1 << 13;
         }

         /* first pixel of the pair */
         output_pixel(&dest[0], av_clip_uintp2(R_B + Y1, 30) >> 14);
         output_pixel(&dest[1], av_clip_uintp2(  G + Y1, 30) >> 14);
         output_pixel(&dest[2], av_clip_uintp2(B_R + Y1, 30) >> 14);

         /* second pixel starts one pixel stride further on */
         output_pixel(&dest[comps + 0], av_clip_uintp2(R_B + Y2, 30) >> 14);
         output_pixel(&dest[comps + 1], av_clip_uintp2(  G + Y2, 30) >> 14);
         output_pixel(&dest[comps + 2], av_clip_uintp2(B_R + Y2, 30) >> 14);

         if (eightbytes) {
             output_pixel(&dest[3], av_clip_uintp2(A1      , 30) >> 14);
             output_pixel(&dest[7], av_clip_uintp2(A2      , 30) >> 14);
         }

         dest += 2 * comps;
     }
 }


 /*
  * Convert one unblended luma line to packed RGB with 16 bits per component,
  * two output pixels per iteration.
  *
  * Luma comes from buf0 only. Chroma comes from ubuf[0]/vbuf[0] alone when
  * uvalpha < 2048; otherwise the two chroma lines are summed and the wider
  * shift (>> 3 instead of >> 2) halves the sum. abuf0 is read only when
  * hasAlpha is non-zero; without it A1/A2 keep their initial 0xffff << 14.
  * When eightbytes is non-zero every pixel occupies four uint16_t components
  * (alpha last), otherwise three.
  * The y argument is not referenced directly in this function.
  */
 static av_always_inline void
 yuv2rgba64_1_c_template(SwsContext *c, const int32_t *buf0,
                        const int32_t *ubuf[2], const int32_t *vbuf[2],
                        const int32_t *abuf0, uint16_t *dest, int dstW,
                        int uvalpha, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
 {
     const int32_t *ubuf0 = ubuf[0], *vbuf0 = vbuf[0];
     int i;
     /* Alpha accumulators used by both branches below. */
     int A1 = 0xffff<<14, A2= 0xffff<<14;

     if (uvalpha < 2048) {
         /* single chroma line */
         for (i = 0; i < ((dstW + 1) >> 1); i++) {
             int Y1 = (buf0[i * 2]    ) >> 2;
             int Y2 = (buf0[i * 2 + 1]) >> 2;
             int U  = (ubuf0[i] - (128 << 11)) >> 2;
             int V  = (vbuf0[i] - (128 << 11)) >> 2;
             int R, G, B;

             Y1 -= c->yuv2rgb_y_offset;
             Y2 -= c->yuv2rgb_y_offset;
             Y1 *= c->yuv2rgb_y_coeff;
             Y2 *= c->yuv2rgb_y_coeff;
             Y1 += 1 << 13; /* rounding term for the final >> 14 */
             Y2 += 1 << 13;

             if (hasAlpha) {
                 /* Multiply instead of shifting: << on a negative signed
                  * value is undefined behaviour in C. */
                 A1 = abuf0[i * 2    ] * (1 << 11);
                 A2 = abuf0[i * 2 + 1] * (1 << 11);

                 A1 += 1 << 13;
                 A2 += 1 << 13;
             }

             R = V * c->yuv2rgb_v2r_coeff;
             G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
             B =                            U * c->yuv2rgb_u2b_coeff;

             output_pixel(&dest[0], av_clip_uintp2(R_B + Y1, 30) >> 14);
             output_pixel(&dest[1], av_clip_uintp2(  G + Y1, 30) >> 14);
             output_pixel(&dest[2], av_clip_uintp2(B_R + Y1, 30) >> 14);
             if (eightbytes) {
                 output_pixel(&dest[3], av_clip_uintp2(A1      , 30) >> 14);
                 output_pixel(&dest[4], av_clip_uintp2(R_B + Y2, 30) >> 14);
                 output_pixel(&dest[5], av_clip_uintp2(  G + Y2, 30) >> 14);
                 output_pixel(&dest[6], av_clip_uintp2(B_R + Y2, 30) >> 14);
                 output_pixel(&dest[7], av_clip_uintp2(A2      , 30) >> 14);
                 dest += 8;
             } else {
                 output_pixel(&dest[3], av_clip_uintp2(R_B + Y2, 30) >> 14);
                 output_pixel(&dest[4], av_clip_uintp2(  G + Y2, 30) >> 14);
                 output_pixel(&dest[5], av_clip_uintp2(B_R + Y2, 30) >> 14);
                 dest += 6;
             }
         }
     } else {
         /* two chroma lines, summed and halved by the >> 3 */
         const int32_t *ubuf1 = ubuf[1], *vbuf1 = vbuf[1];

         for (i = 0; i < ((dstW + 1) >> 1); i++) {
             int Y1 = (buf0[i * 2]    ) >> 2;
             int Y2 = (buf0[i * 2 + 1]) >> 2;
             int U  = (ubuf0[i] + ubuf1[i] - (128 << 12)) >> 3;
             int V  = (vbuf0[i] + vbuf1[i] - (128 << 12)) >> 3;
             int R, G, B;

             Y1 -= c->yuv2rgb_y_offset;
             Y2 -= c->yuv2rgb_y_offset;
             Y1 *= c->yuv2rgb_y_coeff;
             Y2 *= c->yuv2rgb_y_coeff;
             Y1 += 1 << 13;
             Y2 += 1 << 13;

             if (hasAlpha) {
                 /* Multiply instead of shifting: << on a negative signed
                  * value is undefined behaviour in C. */
                 A1 = abuf0[i * 2    ] * (1 << 11);
                 A2 = abuf0[i * 2 + 1] * (1 << 11);

                 A1 += 1 << 13;
                 A2 += 1 << 13;
             }

             R = V * c->yuv2rgb_v2r_coeff;
             G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
             B =                            U * c->yuv2rgb_u2b_coeff;

             output_pixel(&dest[0], av_clip_uintp2(R_B + Y1, 30) >> 14);
             output_pixel(&dest[1], av_clip_uintp2(  G + Y1, 30) >> 14);
             output_pixel(&dest[2], av_clip_uintp2(B_R + Y1, 30) >> 14);
             if (eightbytes) {
                 output_pixel(&dest[3], av_clip_uintp2(A1      , 30) >> 14);
                 output_pixel(&dest[4], av_clip_uintp2(R_B + Y2, 30) >> 14);
                 output_pixel(&dest[5], av_clip_uintp2(  G + Y2, 30) >> 14);
                 output_pixel(&dest[6], av_clip_uintp2(B_R + Y2, 30) >> 14);
                 output_pixel(&dest[7], av_clip_uintp2(A2      , 30) >> 14);
                 dest += 8;
             } else {
                 output_pixel(&dest[3], av_clip_uintp2(R_B + Y2, 30) >> 14);
                 output_pixel(&dest[4], av_clip_uintp2(  G + Y2, 30) >> 14);
                 output_pixel(&dest[5], av_clip_uintp2(B_R + Y2, 30) >> 14);
                 dest += 6;
             }
         }
     }
 }


 /*
  * Vertically filter lumFilterSize luma/alpha lines and chrFilterSize chroma
  * lines, then convert to packed RGB with 16 bits per component, one output
  * pixel per iteration (one U/V sample per pixel).
  *
  * alpSrc is read only when hasAlpha is non-zero; otherwise A keeps its
  * initial value 0xffff << 14. When eightbytes is non-zero each pixel
  * occupies four uint16_t components (alpha last), otherwise three.
  * The y argument is not referenced directly in this function.
  */
 static av_always_inline void
 yuv2rgba64_full_X_c_template(SwsContext *c, const int16_t *lumFilter,
                        const int32_t **lumSrc, int lumFilterSize,
                        const int16_t *chrFilter, const int32_t **chrUSrc,
                        const int32_t **chrVSrc, int chrFilterSize,
                        const int32_t **alpSrc, uint16_t *dest, int dstW,
                        int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
 {
     int A = 0xffff<<14;
     int i;

     for (i = 0; i < dstW; i++) {
         /* The luma accumulator starts at -2^30; the + 0x10000 after the
          * >> 14 below undoes that bias. */
         int Y = -0x40000000;
         int U = -(128 << 23);
         int V = -(128 << 23);
         int R, G, B;
         int tap;

         for (tap = 0; tap < lumFilterSize; tap++) {
             Y += lumSrc[tap][i] * (unsigned)lumFilter[tap];
         }

         for (tap = 0; tap < chrFilterSize; tap++) {
             U += chrUSrc[tap][i] * (unsigned)chrFilter[tap];
             V += chrVSrc[tap][i] * (unsigned)chrFilter[tap];
         }

         if (hasAlpha) {
             A = -0x40000000;
             for (tap = 0; tap < lumFilterSize; tap++) {
                 A += alpSrc[tap][i] * (unsigned)lumFilter[tap];
             }
             A >>= 1;
             /* 0x20000000 cancels the halved bias, 0x2000 is the rounding
              * term for the final >> 14 */
             A += 0x20002000;
         }

         /* luma: drop filter precision, undo bias, then offset and gain */
         Y >>= 14;
         Y  += 0x10000;
         Y  -= c->yuv2rgb_y_offset;
         Y  *= c->yuv2rgb_y_coeff;
         Y  += 1 << 13;

         /* chroma contributions */
         U >>= 14;
         V >>= 14;
         B =                            U * c->yuv2rgb_u2b_coeff;
         G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
         R = V * c->yuv2rgb_v2r_coeff;

         output_pixel(&dest[0], av_clip_uintp2(R_B + Y, 30) >> 14);
         output_pixel(&dest[1], av_clip_uintp2(  G + Y, 30) >> 14);
         output_pixel(&dest[2], av_clip_uintp2(B_R + Y, 30) >> 14);
         if (eightbytes) {
             output_pixel(&dest[3], av_clip_uintp2(A, 30) >> 14);
         }

         dest += eightbytes ? 4 : 3;
     }
 }


 /*
  * Blend two vertically adjacent source lines and convert the result to
  * packed RGB with 16 bits per component, one output pixel per iteration
  * (one U/V sample per pixel).
  *
  * Line 0 of each buffer pair is weighted by (4096 - alpha) and line 1 by
  * alpha, with yalpha used for luma and alpha samples and uvalpha for chroma.
  * abuf is dereferenced only when hasAlpha is non-zero; otherwise A keeps its
  * initial value 0xffff << 14. When eightbytes is non-zero each pixel
  * occupies four uint16_t components (alpha last), otherwise three.
  * The y argument is not referenced directly in this function.
  */
 static av_always_inline void
 yuv2rgba64_full_2_c_template(SwsContext *c, const int32_t *buf[2],
                        const int32_t *ubuf[2], const int32_t *vbuf[2],
                        const int32_t *abuf[2], uint16_t *dest, int dstW,
                        int yalpha, int uvalpha, int y,
                        enum AVPixelFormat target, int hasAlpha, int eightbytes)
 {
     const int32_t *buf0  = buf[0];
     const int32_t *buf1  = buf[1];
     const int32_t *ubuf0 = ubuf[0];
     const int32_t *ubuf1 = ubuf[1];
     const int32_t *vbuf0 = vbuf[0];
     const int32_t *vbuf1 = vbuf[1];
     const int32_t *abuf0 = NULL;
     const int32_t *abuf1 = NULL;
     const int  yalpha1 = 4096 - yalpha;
     const int uvalpha1 = 4096 - uvalpha;
     int A = 0xffff<<14;
     int i;

     if (hasAlpha) {
         abuf0 = abuf[0];
         abuf1 = abuf[1];
     }

     av_assert2(yalpha  <= 4096U);
     av_assert2(uvalpha <= 4096U);

     for (i = 0; i < dstW; i++) {
         int Y = (buf0[i]  * yalpha1  + buf1[i]  * yalpha) >> 14;
         int U = (ubuf0[i] * uvalpha1 + ubuf1[i] * uvalpha - (128 << 23)) >> 14;
         int V = (vbuf0[i] * uvalpha1 + vbuf1[i] * uvalpha - (128 << 23)) >> 14;
         int R, G, B;

         /* luma: remove the offset, apply the gain, add the rounding term
          * for the final >> 14 */
         Y -= c->yuv2rgb_y_offset;
         Y *= c->yuv2rgb_y_coeff;
         Y += 1 << 13;

         /* chroma contributions */
         B =                            U * c->yuv2rgb_u2b_coeff;
         G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
         R = V * c->yuv2rgb_v2r_coeff;

         if (hasAlpha) {
             A  = (abuf0[i] * yalpha1 + abuf1[i] * yalpha) >> 1;
             A += 1 << 13;
         }

         output_pixel(&dest[0], av_clip_uintp2(R_B + Y, 30) >> 14);
         output_pixel(&dest[1], av_clip_uintp2(  G + Y, 30) >> 14);
         output_pixel(&dest[2], av_clip_uintp2(B_R + Y, 30) >> 14);
         if (eightbytes) {
             output_pixel(&dest[3], av_clip_uintp2(A, 30) >> 14);
         }

         dest += eightbytes ? 4 : 3;
     }
 }


 /*
  * Convert one unblended luma line to packed RGB with 16 bits per component,
  * one output pixel per iteration (one U/V sample per pixel).
  *
  * Luma comes from buf0 only. Chroma comes from ubuf[0]/vbuf[0] alone when
  * uvalpha < 2048; otherwise the two chroma lines are summed and the wider
  * shift (>> 3 instead of >> 2) halves the sum. abuf0 is read only when
  * hasAlpha is non-zero; without it A keeps its initial 0xffff << 14.
  * When eightbytes is non-zero each pixel occupies four uint16_t components
  * (alpha last), otherwise three.
  * The y argument is not referenced directly in this function.
  */
 static av_always_inline void
 yuv2rgba64_full_1_c_template(SwsContext *c, const int32_t *buf0,
                        const int32_t *ubuf[2], const int32_t *vbuf[2],
                        const int32_t *abuf0, uint16_t *dest, int dstW,
                        int uvalpha, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
 {
     const int32_t *ubuf0 = ubuf[0], *vbuf0 = vbuf[0];
     int i;
     /* Alpha accumulator used by both branches below. */
     int A = 0xffff<<14;

     if (uvalpha < 2048) {
         /* single chroma line */
         for (i = 0; i < dstW; i++) {
             int Y  = (buf0[i]) >> 2;
             int U  = (ubuf0[i] - (128 << 11)) >> 2;
             int V  = (vbuf0[i] - (128 << 11)) >> 2;
             int R, G, B;

             Y -= c->yuv2rgb_y_offset;
             Y *= c->yuv2rgb_y_coeff;
             Y += 1 << 13; /* rounding term for the final >> 14 */

             if (hasAlpha) {
                 /* Multiply instead of shifting: << on a negative signed
                  * value is undefined behaviour in C. */
                 A = abuf0[i] * (1 << 11);

                 A += 1 << 13;
             }

             R = V * c->yuv2rgb_v2r_coeff;
             G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
             B =                            U * c->yuv2rgb_u2b_coeff;

             output_pixel(&dest[0], av_clip_uintp2(R_B + Y, 30) >> 14);
             output_pixel(&dest[1], av_clip_uintp2(  G + Y, 30) >> 14);
             output_pixel(&dest[2], av_clip_uintp2(B_R + Y, 30) >> 14);
             if (eightbytes) {
                 output_pixel(&dest[3], av_clip_uintp2(A, 30) >> 14);
                 dest += 4;
             } else {
                 dest += 3;
             }
         }
     } else {
         /* two chroma lines, summed and halved by the >> 3 */
         const int32_t *ubuf1 = ubuf[1], *vbuf1 = vbuf[1];

         for (i = 0; i < dstW; i++) {
             int Y  = (buf0[i]    ) >> 2;
             int U  = (ubuf0[i] + ubuf1[i] - (128 << 12)) >> 3;
             int V  = (vbuf0[i] + vbuf1[i] - (128 << 12)) >> 3;
             int R, G, B;

             Y -= c->yuv2rgb_y_offset;
             Y *= c->yuv2rgb_y_coeff;
             Y += 1 << 13;

             if (hasAlpha) {
                 /* Multiply instead of shifting: << on a negative signed
                  * value is undefined behaviour in C. */
                 A = abuf0[i] * (1 << 11);

                 A += 1 << 13;
             }

             R = V * c->yuv2rgb_v2r_coeff;
             G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
             B =                            U * c->yuv2rgb_u2b_coeff;

             output_pixel(&dest[0], av_clip_uintp2(R_B + Y, 30) >> 14);
             output_pixel(&dest[1], av_clip_uintp2(  G + Y, 30) >> 14);
             output_pixel(&dest[2], av_clip_uintp2(B_R + Y, 30) >> 14);
             if (eightbytes) {
                 output_pixel(&dest[3], av_clip_uintp2(A, 30) >> 14);
                 dest += 4;
             } else {
                 dest += 3;
             }
         }
     }
 }


 /*
  * Drop the helper macros used by the 16-bit packed RGB templates above.
  * NOTE(review): those templates reference the upper-case names R_B / B_R,
  * while the names undefined here are lower-case r_b / b_r. If the macros
  * are defined in upper case, they stay defined past this point; confirm
  * against the #define site before changing anything.
  */
 #undef output_pixel

 #undef r_b

 #undef b_r


 /*
  * Generates the three entry points name##ext##_X_c, name##ext##_2_c and
  * name##ext##_1_c for one packed output format with 16 bits per component.
  * Each wrapper accepts int16_t source pointers and a uint8_t destination,
  * casts them to the int32_t / uint16_t pointers taken by the matching
  * name##base##_{X,2,1}_c_template function, and forwards fmt, hasAlpha and
  * eightbytes to that template unchanged.
  */
 #define YUV2PACKED16WRAPPER(name, base, ext, fmt, hasAlpha, eightbytes) \

 static void name ## ext ## _X_c(SwsContext *c, const int16_t *lumFilter, \

                         const int16_t **_lumSrc, int lumFilterSize, \

                         const int16_t *chrFilter, const int16_t **_chrUSrc, \

                         const int16_t **_chrVSrc, int chrFilterSize, \

                         const int16_t **_alpSrc, uint8_t *_dest, int dstW, \

                         int y) \

 { \

     const int32_t **lumSrc  = (const int32_t **) _lumSrc, \

                   **chrUSrc = (const int32_t **) _chrUSrc, \

                   **chrVSrc = (const int32_t **) _chrVSrc, \

                   **alpSrc  = (const int32_t **) _alpSrc; \

     uint16_t *dest = (uint16_t *) _dest; \

     name ## base ## _X_c_template(c, lumFilter, lumSrc, lumFilterSize, \

                           chrFilter, chrUSrc, chrVSrc, chrFilterSize, \

                           alpSrc, dest, dstW, y, fmt, hasAlpha, eightbytes); \

 } \

  \

 static void name ## ext ## _2_c(SwsContext *c, const int16_t *_buf[2], \

                         const int16_t *_ubuf[2], const int16_t *_vbuf[2], \

                         const int16_t *_abuf[2], uint8_t *_dest, int dstW, \

                         int yalpha, int uvalpha, int y) \

 { \

     const int32_t **buf  = (const int32_t **) _buf, \

                   **ubuf = (const int32_t **) _ubuf, \

                   **vbuf = (const int32_t **) _vbuf, \

                   **abuf = (const int32_t **) _abuf; \

     uint16_t *dest = (uint16_t *) _dest; \

     name ## base ## _2_c_template(c, buf, ubuf, vbuf, abuf, \

                           dest, dstW, yalpha, uvalpha, y, fmt, hasAlpha, eightbytes); \

 } \

  \

 static void name ## ext ## _1_c(SwsContext *c, const int16_t *_buf0, \

                         const int16_t *_ubuf[2], const int16_t *_vbuf[2], \

                         const int16_t *_abuf0, uint8_t *_dest, int dstW, \

                         int uvalpha, int y) \

 { \

     const int32_t *buf0  = (const int32_t *)  _buf0, \

                  **ubuf  = (const int32_t **) _ubuf, \

                  **vbuf  = (const int32_t **) _vbuf, \

                   *abuf0 = (const int32_t *)  _abuf0; \

     uint16_t *dest = (uint16_t *) _dest; \

     name ## base ## _1_c_template(c, buf0, ubuf, vbuf, abuf0, dest, \

                                   dstW, uvalpha, y, fmt, hasAlpha, eightbytes); \

 }


 /*
  * Wrapper instantiations built on the yuv2rgba64_*_c_template functions
  * (two output pixels per chroma sample). The last two arguments are
  * hasAlpha and eightbytes: the 48-bit formats use 0, 0; the rgba64/bgra64
  * variants use 1, 1; the rgbx64/bgrx64 variants use 0, 1, so an alpha
  * component is written but no alpha source is read.
  */
 YUV2PACKED16WRAPPER(yuv2, rgba64, rgb48be, AV_PIX_FMT_RGB48BE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64, rgb48le, AV_PIX_FMT_RGB48LE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64, bgr48be, AV_PIX_FMT_BGR48BE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64, bgr48le, AV_PIX_FMT_BGR48LE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64, rgba64be, AV_PIX_FMT_RGBA64BE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64, rgba64le, AV_PIX_FMT_RGBA64LE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64, rgbx64be, AV_PIX_FMT_RGBA64BE, 0, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64, rgbx64le, AV_PIX_FMT_RGBA64LE, 0, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64, bgra64be, AV_PIX_FMT_BGRA64BE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64, bgra64le, AV_PIX_FMT_BGRA64LE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64, bgrx64be, AV_PIX_FMT_BGRA64BE, 0, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64, bgrx64le, AV_PIX_FMT_BGRA64LE, 0, 1)


 /*
  * Same set of formats built on the yuv2rgba64_full_*_c_template functions,
  * which read one chroma sample per output pixel.
  */
 YUV2PACKED16WRAPPER(yuv2, rgba64_full, rgb48be_full, AV_PIX_FMT_RGB48BE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, rgb48le_full, AV_PIX_FMT_RGB48LE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, bgr48be_full, AV_PIX_FMT_BGR48BE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, bgr48le_full, AV_PIX_FMT_BGR48LE, 0, 0)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, rgba64be_full, AV_PIX_FMT_RGBA64BE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, rgba64le_full, AV_PIX_FMT_RGBA64LE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, rgbx64be_full, AV_PIX_FMT_RGBA64BE, 0, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, rgbx64le_full, AV_PIX_FMT_RGBA64LE, 0, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, bgra64be_full, AV_PIX_FMT_BGRA64BE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, bgra64le_full, AV_PIX_FMT_BGRA64LE, 1, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, bgrx64be_full, AV_PIX_FMT_BGRA64BE, 0, 1)

 YUV2PACKED16WRAPPER(yuv2, rgba64_full, bgrx64le_full, AV_PIX_FMT_BGRA64LE, 0, 1)


 /*
  * Store two adjacent RGB pixels in the target pixel format.
  *
  * _r, _g and _b point into the R/G/B lookup tables generated by
  * ff_yuv2rgb_c_init_tables(), which take care of things like endianness
  * conversion and shifting. The caller has already applied the offset that
  * corresponds to the chroma (U/V) values; this function indexes the tables
  * with the luminance values Y1/Y2 (plus a dither offset for the 16-bit and
  * 8/4-bit formats) and combines the three lookups into the pixels of pair
  * index i. A1/A2 are only used by the 32-bit formats when hasAlpha is set;
  * y selects the dither row.
  */
 static av_always_inline void
 yuv2rgb_write(uint8_t *_dest, int i, int Y1, int Y2,
               unsigned A1, unsigned A2,
               const void *_r, const void *_g, const void *_b, int y,
               enum AVPixelFormat target, int hasAlpha)
 {
     if (target == AV_PIX_FMT_ARGB || target == AV_PIX_FMT_RGBA ||
         target == AV_PIX_FMT_ABGR || target == AV_PIX_FMT_BGRA) {
         /* 32-bit packed: one uint32_t per pixel */
         uint32_t *out = (uint32_t *) _dest + i * 2;
         const uint32_t *r = _r;
         const uint32_t *g = _g;
         const uint32_t *b = _b;

 #if CONFIG_SMALL
         int sh = 0;

         if (hasAlpha && !(target == AV_PIX_FMT_RGB32_1 || target == AV_PIX_FMT_BGR32_1)) {
             sh = 24;
         }

         out[0] = r[Y1] + g[Y1] + b[Y1] + (hasAlpha ? A1 << sh : 0);
         out[1] = r[Y2] + g[Y2] + b[Y2] + (hasAlpha ? A2 << sh : 0);
 #else
         if (!hasAlpha) {
 #if defined(ASSERT_LEVEL) && ASSERT_LEVEL > 1
             int sh = (target == AV_PIX_FMT_RGB32_1 || target == AV_PIX_FMT_BGR32_1) ? 0 : 24;

             /* the table sum is expected to carry 0xFF in the alpha byte */
             av_assert2((((r[Y1] + g[Y1] + b[Y1]) >> sh) & 0xFF) == 0xFF);
 #endif
             out[0] = r[Y1] + g[Y1] + b[Y1];
             out[1] = r[Y2] + g[Y2] + b[Y2];
         } else {
             int sh = (target == AV_PIX_FMT_RGB32_1 || target == AV_PIX_FMT_BGR32_1) ? 0 : 24;

             /* the table sum is expected to leave the alpha byte clear */
             av_assert2((((r[Y1] + g[Y1] + b[Y1]) >> sh) & 0xFF) == 0);
             out[0] = r[Y1] + g[Y1] + b[Y1] + (A1 << sh);
             out[1] = r[Y2] + g[Y2] + b[Y2] + (A2 << sh);
         }
 #endif
     } else if (target == AV_PIX_FMT_RGB24 || target == AV_PIX_FMT_BGR24) {
         /* 24-bit packed: three bytes per pixel, component order set by target */
         uint8_t *out = _dest + i * 6;
         const uint8_t *r = _r;
         const uint8_t *g = _g;
         const uint8_t *b = _b;
         const uint8_t *first = (target == AV_PIX_FMT_RGB24) ? r : b;
         const uint8_t *last  = (target == AV_PIX_FMT_RGB24) ? b : r;

         out[0] = first[Y1];
         out[1] =     g[Y1];
         out[2] =  last[Y1];
         out[3] = first[Y2];
         out[4] =     g[Y2];
         out[5] =  last[Y2];
     } else if (target == AV_PIX_FMT_RGB565 || target == AV_PIX_FMT_BGR565 ||
                target == AV_PIX_FMT_RGB555 || target == AV_PIX_FMT_BGR555 ||
                target == AV_PIX_FMT_RGB444 || target == AV_PIX_FMT_BGR444) {
         /* 16-bit packed: one uint16_t per pixel, dithered per row */
         uint16_t *out = (uint16_t *) _dest + i * 2;
         const uint16_t *r = _r;
         const uint16_t *g = _g;
         const uint16_t *b = _b;
         int dr1, dg1, db1, dr2, dg2, db2;

         if (target == AV_PIX_FMT_RGB565 || target == AV_PIX_FMT_BGR565) {
             const uint8_t *const rd = ff_dither_2x2_8[ y & 1     ];
             const uint8_t *const gd = ff_dither_2x2_4[ y & 1     ];
             const uint8_t *const bd = ff_dither_2x2_8[(y & 1) ^ 1];

             dr1 = rd[0];
             dg1 = gd[0];
             db1 = bd[0];
             dr2 = rd[1];
             dg2 = gd[1];
             db2 = bd[1];
         } else if (target == AV_PIX_FMT_RGB555 || target == AV_PIX_FMT_BGR555) {
             const uint8_t *const rd = ff_dither_2x2_8[ y & 1     ];
             const uint8_t *const bd = ff_dither_2x2_8[(y & 1) ^ 1];

             /* green uses the red row with the two columns swapped */
             dr1 = rd[0];
             dg1 = rd[1];
             db1 = bd[0];
             dr2 = rd[1];
             dg2 = rd[0];
             db2 = bd[1];
         } else {
             const uint8_t *const rd = ff_dither_4x4_16[ y & 3     ];
             const uint8_t *const bd = ff_dither_4x4_16[(y & 3) ^ 3];

             /* green uses the red row with the two columns swapped */
             dr1 = rd[0];
             dg1 = rd[1];
             db1 = bd[0];
             dr2 = rd[1];
             dg2 = rd[0];
             db2 = bd[1];
         }

         out[0] = r[Y1 + dr1] + g[Y1 + dg1] + b[Y1 + db1];
         out[1] = r[Y2 + dr2] + g[Y2 + dg2] + b[Y2 + db2];
     } else /* 8/4 bits */ {
         uint8_t *dest = _dest;
         const uint8_t *r = _r;
         const uint8_t *g = _g;
         const uint8_t *b = _b;
         /* dither columns for the first and second pixel of the pair */
         const int col1 = (i * 2 + 0) & 7;
         const int col2 = (i * 2 + 1) & 7;
         int dr1, dg1, db1, dr2, dg2, db2;
         int px1, px2;

         if (target == AV_PIX_FMT_RGB8 || target == AV_PIX_FMT_BGR8) {
             const uint8_t * const d64 = ff_dither_8x8_73[y & 7];
             const uint8_t * const d32 = ff_dither_8x8_32[y & 7];

             dr1 = dg1 = d32[col1];
             db1 =       d64[col1];
             dr2 = dg2 = d32[col2];
             db2 =       d64[col2];
         } else {
             const uint8_t * const d64  = ff_dither_8x8_73 [y & 7];
             const uint8_t * const d128 = ff_dither_8x8_220[y & 7];

             dr1 = db1 = d128[col1];
             dg1 =        d64[col1];
             dr2 = db2 = d128[col2];
             dg2 =        d64[col2];
         }

         px1 = r[Y1 + dr1] + g[Y1 + dg1] + b[Y1 + db1];
         px2 = r[Y2 + dr2] + g[Y2 + dg2] + b[Y2 + db2];

         if (target == AV_PIX_FMT_RGB4 || target == AV_PIX_FMT_BGR4) {
             /* two 4-bit pixels share one byte, second pixel in the high nibble */
             dest[i] = px1 + (px2 << 4);
         } else {
             dest[i * 2 + 0] = px1;
             dest[i * 2 + 1] = px2;
         }
     }
 }


 /*
  * Vertically filter lumFilterSize luma/alpha lines and chrFilterSize chroma
  * lines, then emit two RGB pixels per iteration through yuv2rgb_write().
  *
  * Every accumulator starts at 1 << 18, the rounding term for the >> 19 that
  * follows. The filtered U/V values (offset by YUVRGB_TABLE_HEADROOM) select
  * the per-chroma R/G/B table pointers in the context; the filtered luma
  * values are handed to yuv2rgb_write() as the indices into those tables.
  * alpSrc is read only when hasAlpha is non-zero; otherwise 0 is passed as
  * alpha.
  */
 static av_always_inline void
 yuv2rgb_X_c_template(SwsContext *c, const int16_t *lumFilter,
                      const int16_t **lumSrc, int lumFilterSize,
                      const int16_t *chrFilter, const int16_t **chrUSrc,
                      const int16_t **chrVSrc, int chrFilterSize,
                      const int16_t **alpSrc, uint8_t *dest, int dstW,
                      int y, enum AVPixelFormat target, int hasAlpha)
 {
     const int pairs = (dstW + 1) >> 1;
     int i;

     for (i = 0; i < pairs; i++) {
         const int x0 = i * 2;
         const int x1 = i * 2 + 1;
         int luma0 = 1 << 18;
         int luma1 = 1 << 18;
         int cb    = 1 << 18;
         int cr    = 1 << 18;
         int alpha0 = 0, alpha1 = 0;
         int tap;
         const void *r, *g, *b;

         for (tap = 0; tap < lumFilterSize; tap++) {
             luma0 += lumSrc[tap][x0] * lumFilter[tap];
             luma1 += lumSrc[tap][x1] * lumFilter[tap];
         }
         luma0 >>= 19;
         luma1 >>= 19;

         for (tap = 0; tap < chrFilterSize; tap++) {
             cb += chrUSrc[tap][i] * chrFilter[tap];
             cr += chrVSrc[tap][i] * chrFilter[tap];
         }
         cb >>= 19;
         cr >>= 19;

         if (hasAlpha) {
             alpha0 = 1 << 18;
             alpha1 = 1 << 18;
             for (tap = 0; tap < lumFilterSize; tap++) {
                 alpha0 += alpSrc[tap][x0] * lumFilter[tap];
                 alpha1 += alpSrc[tap][x1] * lumFilter[tap];
             }
             alpha0 >>= 19;
             alpha1 >>= 19;
             /* clip only when bit 8 of either value is set */
             if ((alpha0 | alpha1) & 0x100) {
                 alpha0 = av_clip_uint8(alpha0);
                 alpha1 = av_clip_uint8(alpha1);
             }
         }

         r =  c->table_rV[cr + YUVRGB_TABLE_HEADROOM];
         g = (c->table_gU[cb + YUVRGB_TABLE_HEADROOM] + c->table_gV[cr + YUVRGB_TABLE_HEADROOM]);
         b =  c->table_bU[cb + YUVRGB_TABLE_HEADROOM];

         yuv2rgb_write(dest, i, luma0, luma1, alpha0, alpha1,
                       r, g, b, y, target, hasAlpha);
     }
 }


 /*
  * Blend two vertically adjacent source lines and emit two RGB pixels per
  * iteration through yuv2rgb_write().
  *
  * Line 0 of each buffer pair is weighted by (4096 - alpha) and line 1 by
  * alpha, with yalpha used for luma and alpha samples and uvalpha for chroma;
  * the weighted sum is reduced with >> 19. abuf is dereferenced only when
  * hasAlpha is non-zero; otherwise 0 is passed as alpha.
  */
 static av_always_inline void
 yuv2rgb_2_c_template(SwsContext *c, const int16_t *buf[2],
                      const int16_t *ubuf[2], const int16_t *vbuf[2],
                      const int16_t *abuf[2], uint8_t *dest, int dstW,
                      int yalpha, int uvalpha, int y,
                      enum AVPixelFormat target, int hasAlpha)
 {
     const int16_t *buf0  = buf[0];
     const int16_t *buf1  = buf[1];
     const int16_t *ubuf0 = ubuf[0];
     const int16_t *ubuf1 = ubuf[1];
     const int16_t *vbuf0 = vbuf[0];
     const int16_t *vbuf1 = vbuf[1];
     const int16_t *abuf0 = NULL;
     const int16_t *abuf1 = NULL;
     const int  yalpha1 = 4096 - yalpha;
     const int uvalpha1 = 4096 - uvalpha;
     const int pairs    = (dstW + 1) >> 1;
     int i;

     if (hasAlpha) {
         abuf0 = abuf[0];
         abuf1 = abuf[1];
     }

     av_assert2(yalpha  <= 4096U);
     av_assert2(uvalpha <= 4096U);

     for (i = 0; i < pairs; i++) {
         const int x0 = i * 2;
         const int x1 = i * 2 + 1;
         const int luma0 = (buf0[x0] * yalpha1  + buf1[x0] * yalpha)  >> 19;
         const int luma1 = (buf0[x1] * yalpha1  + buf1[x1] * yalpha)  >> 19;
         const int cb    = (ubuf0[i] * uvalpha1 + ubuf1[i] * uvalpha) >> 19;
         const int cr    = (vbuf0[i] * uvalpha1 + vbuf1[i] * uvalpha) >> 19;
         int alpha0 = 0, alpha1 = 0;
         const void *r =  c->table_rV[cr + YUVRGB_TABLE_HEADROOM],
                    *g = (c->table_gU[cb + YUVRGB_TABLE_HEADROOM] + c->table_gV[cr + YUVRGB_TABLE_HEADROOM]),
                    *b =  c->table_bU[cb + YUVRGB_TABLE_HEADROOM];

         if (hasAlpha) {
             alpha0 = (abuf0[x0] * yalpha1 + abuf1[x0] * yalpha) >> 19;
             alpha1 = (abuf0[x1] * yalpha1 + abuf1[x1] * yalpha) >> 19;
             alpha0 = av_clip_uint8(alpha0);
             alpha1 = av_clip_uint8(alpha1);
         }

         yuv2rgb_write(dest, i, luma0, luma1, alpha0, alpha1,
                       r, g, b, y, target, hasAlpha);
     }
 }


 /*
  * Convert one unblended luma line and emit two RGB pixels per iteration
  * through yuv2rgb_write().
  *
  * Luma comes from buf0 only, rounded with (+ 64) >> 7. Chroma comes from
  * ubuf[0]/vbuf[0] alone when uvalpha < 2048; otherwise the two chroma lines
  * are summed and rounded with (+ 128) >> 8. abuf0 is read only when
  * hasAlpha is non-zero; otherwise 0 is passed as alpha.
  *
  * NOTE(review): the two branches scale alpha differently
  * ((a * 255 + 16384) >> 15 versus (a + 64) >> 7); both forms are kept
  * exactly as they are. Confirm whether the difference is intended.
  */
 static av_always_inline void
 yuv2rgb_1_c_template(SwsContext *c, const int16_t *buf0,
                      const int16_t *ubuf[2], const int16_t *vbuf[2],
                      const int16_t *abuf0, uint8_t *dest, int dstW,
                      int uvalpha, int y, enum AVPixelFormat target,
                      int hasAlpha)
 {
     const int16_t *ubuf0 = ubuf[0];
     const int16_t *vbuf0 = vbuf[0];
     const int pairs = (dstW + 1) >> 1;
     int i;

     if (uvalpha < 2048) {
         /* single chroma line */
         for (i = 0; i < pairs; i++) {
             const int x0 = i * 2;
             const int x1 = i * 2 + 1;
             const int luma0 = (buf0[x0] + 64) >> 7;
             const int luma1 = (buf0[x1] + 64) >> 7;
             const int cb    = (ubuf0[i] + 64) >> 7;
             const int cr    = (vbuf0[i] + 64) >> 7;
             int alpha0 = 0, alpha1 = 0;
             const void *r =  c->table_rV[cr + YUVRGB_TABLE_HEADROOM],
                        *g = (c->table_gU[cb + YUVRGB_TABLE_HEADROOM] + c->table_gV[cr + YUVRGB_TABLE_HEADROOM]),
                        *b =  c->table_bU[cb + YUVRGB_TABLE_HEADROOM];

             if (hasAlpha) {
                 alpha0 = (abuf0[x0] * 255 + 16384) >> 15;
                 alpha1 = (abuf0[x1] * 255 + 16384) >> 15;
                 alpha0 = av_clip_uint8(alpha0);
                 alpha1 = av_clip_uint8(alpha1);
             }

             yuv2rgb_write(dest, i, luma0, luma1, alpha0, alpha1,
                           r, g, b, y, target, hasAlpha);
         }
     } else {
         /* two chroma lines, summed and reduced by one extra bit */
         const int16_t *ubuf1 = ubuf[1];
         const int16_t *vbuf1 = vbuf[1];

         for (i = 0; i < pairs; i++) {
             const int x0 = i * 2;
             const int x1 = i * 2 + 1;
             const int luma0 = (buf0[x0]            +  64) >> 7;
             const int luma1 = (buf0[x1]            +  64) >> 7;
             const int cb    = (ubuf0[i] + ubuf1[i] + 128) >> 8;
             const int cr    = (vbuf0[i] + vbuf1[i] + 128) >> 8;
             int alpha0 = 0, alpha1 = 0;
             const void *r =  c->table_rV[cr + YUVRGB_TABLE_HEADROOM],
                        *g = (c->table_gU[cb + YUVRGB_TABLE_HEADROOM] + c->table_gV[cr + YUVRGB_TABLE_HEADROOM]),
                        *b =  c->table_bU[cb + YUVRGB_TABLE_HEADROOM];

             if (hasAlpha) {
                 alpha0 = (abuf0[x0] + 64) >> 7;
                 alpha1 = (abuf0[x1] + 64) >> 7;
                 alpha0 = av_clip_uint8(alpha0);
                 alpha1 = av_clip_uint8(alpha1);
             }

             yuv2rgb_write(dest, i, luma0, luma1, alpha0, alpha1,
                           r, g, b, y, target, hasAlpha);
         }
     }
 }


 /*
  * Generates name##ext##_X_c, a non-template entry point that forwards all
  * of its arguments to name##base##_X_c_template and appends fmt and
  * hasAlpha.
  */
 #define YUV2RGBWRAPPERX(name, base, ext, fmt, hasAlpha) \

 static void name ## ext ## _X_c(SwsContext *c, const int16_t *lumFilter, \

                                 const int16_t **lumSrc, int lumFilterSize, \

                                 const int16_t *chrFilter, const int16_t **chrUSrc, \

                                 const int16_t **chrVSrc, int chrFilterSize, \

                                 const int16_t **alpSrc, uint8_t *dest, int dstW, \

                                 int y) \

 { \

     name ## base ## _X_c_template(c, lumFilter, lumSrc, lumFilterSize, \

                                   chrFilter, chrUSrc, chrVSrc, chrFilterSize, \

                                   alpSrc, dest, dstW, y, fmt, hasAlpha); \

 }


 /*
  * Generates the _X_c entry point via YUV2RGBWRAPPERX and, in addition,
  * name##ext##_2_c, which forwards its arguments to
  * name##base##_2_c_template and appends fmt and hasAlpha.
  */
 #define YUV2RGBWRAPPERX2(name, base, ext, fmt, hasAlpha) \

 YUV2RGBWRAPPERX(name, base, ext, fmt, hasAlpha) \

 static void name ## ext ## _2_c(SwsContext *c, const int16_t *buf[2], \

                                 const int16_t *ubuf[2], const int16_t *vbuf[2], \

                                 const int16_t *abuf[2], uint8_t *dest, int dstW, \

                                 int yalpha, int uvalpha, int y) \

 { \

     name ## base ## _2_c_template(c, buf, ubuf, vbuf, abuf, \

                                   dest, dstW, yalpha, uvalpha, y, fmt, hasAlpha); \

 }


 /*
  * Expand YUV2RGBWRAPPERX2() with the same arguments and additionally define
  * the static function name##ext##_1_c(), which forwards its arguments to
  * name##base##_1_c_template() with fmt and hasAlpha appended.
  */
 #define YUV2RGBWRAPPER(name, base, ext, fmt, hasAlpha) \

 YUV2RGBWRAPPERX2(name, base, ext, fmt, hasAlpha) \

 static void name ## ext ## _1_c(SwsContext *c, const int16_t *buf0, \

                                 const int16_t *ubuf[2], const int16_t *vbuf[2], \

                                 const int16_t *abuf0, uint8_t *dest, int dstW, \

                                 int uvalpha, int y) \

 { \

     name ## base ## _1_c_template(c, buf0, ubuf, vbuf, abuf0, dest, \

                                   dstW, uvalpha, y, fmt, hasAlpha); \

 }


 /*
  * Instantiate the wrapper functions for every packed RGB output format
  * handled by the yuv2rgb_*_c_template() functions.
  *
  * With CONFIG_SMALL a single variant per 32-bit format is generated and the
  * hasAlpha argument is the expression CONFIG_SWSCALE_ALPHA && c->needAlpha.
  * Otherwise separate variants with hasAlpha fixed to 1 ("a32", only when
  * CONFIG_SWSCALE_ALPHA is set) and to 0 ("x32") are generated.
  */
 #if CONFIG_SMALL

 YUV2RGBWRAPPER(yuv2rgb,,  32_1,  AV_PIX_FMT_RGB32_1,   CONFIG_SWSCALE_ALPHA && c->needAlpha)

 YUV2RGBWRAPPER(yuv2rgb,,  32,    AV_PIX_FMT_RGB32,     CONFIG_SWSCALE_ALPHA && c->needAlpha)

 #else

 #if CONFIG_SWSCALE_ALPHA

 YUV2RGBWRAPPER(yuv2rgb,, a32_1,  AV_PIX_FMT_RGB32_1,   1)

 YUV2RGBWRAPPER(yuv2rgb,, a32,    AV_PIX_FMT_RGB32,     1)

 #endif

 YUV2RGBWRAPPER(yuv2rgb,, x32_1,  AV_PIX_FMT_RGB32_1,   0)

 YUV2RGBWRAPPER(yuv2rgb,, x32,    AV_PIX_FMT_RGB32,     0)

 #endif

 /* The remaining formats never carry alpha, so hasAlpha is fixed to 0. */
 YUV2RGBWRAPPER(yuv2, rgb, rgb24, AV_PIX_FMT_RGB24,   0)

 YUV2RGBWRAPPER(yuv2, rgb, bgr24, AV_PIX_FMT_BGR24,   0)

 YUV2RGBWRAPPER(yuv2rgb,,  16,    AV_PIX_FMT_RGB565,    0)

 YUV2RGBWRAPPER(yuv2rgb,,  15,    AV_PIX_FMT_RGB555,    0)

 YUV2RGBWRAPPER(yuv2rgb,,  12,    AV_PIX_FMT_RGB444,    0)

 YUV2RGBWRAPPER(yuv2rgb,,   8,    AV_PIX_FMT_RGB8,      0)

 YUV2RGBWRAPPER(yuv2rgb,,   4,    AV_PIX_FMT_RGB4,      0)

 YUV2RGBWRAPPER(yuv2rgb,,   4b,   AV_PIX_FMT_RGB4_BYTE, 0)


 /**
  * Convert one Y/U/V(/A) sample to RGB with the coefficients stored in the
  * context and write the resulting pixel to dest in the layout selected by
  * target.
  *
  * @param c        context providing the yuv2rgb_* coefficients, the dither
  *                 mode and the dither_error rows
  * @param dest     destination of the pixel; 4, 3 or 1 byte(s) are written
  *                 depending on target
  * @param i        horizontal pixel index; indexes c->dither_error and is the
  *                 first coordinate of the A_DITHER/X_DITHER patterns
  * @param Y        luma input, offset and scaled here with yuv2rgb_y_offset
  *                 and yuv2rgb_y_coeff
  * @param A        alpha value stored as-is when hasAlpha is non-zero
  * @param U        chroma input multiplied by the u2g/u2b coefficients
  * @param V        chroma input multiplied by the v2r/v2g coefficients
  * @param y        line number; second coordinate of the A_DITHER/X_DITHER
  *                 patterns
  * @param target   output pixel format
  * @param hasAlpha when zero, 255 is stored in the alpha byte of 32-bit formats
  * @param err      in/out quantization error of the previously written pixel
  *                 for R, G and B (elements 0..2); only used by the
  *                 error-diffusion path of the 4- and 8-bit targets
  */
 static av_always_inline void yuv2rgb_write_full(SwsContext *c,

     uint8_t *dest, int i, int Y, int A, int U, int V,

     int y, enum AVPixelFormat target, int hasAlpha, int err[4])

 {

     int R, G, B;

     int isrgb8 = target == AV_PIX_FMT_BGR8 || target == AV_PIX_FMT_RGB8;


     Y -= c->yuv2rgb_y_offset;

     Y *= c->yuv2rgb_y_coeff;

     /* rounding term for the >> 22 applied to R, G and B below */
     Y += 1 << 21;

     R = Y + V*c->yuv2rgb_v2r_coeff;

     G = Y + V*c->yuv2rgb_v2g_coeff + U*c->yuv2rgb_u2g_coeff;

     B = Y +                          U*c->yuv2rgb_u2b_coeff;

     /* Only clip when one of the two top bits is set in any component;
      * av_clip_uintp2(x, 30) presumably clamps to [0, 2^30 - 1], so that
      * x >> 22 fits in 8 bits. */
     if ((R | G | B) & 0xC0000000) {

         R = av_clip_uintp2(R, 30);

         G = av_clip_uintp2(G, 30);

         B = av_clip_uintp2(B, 30);

     }


     switch(target) {

     case AV_PIX_FMT_ARGB:

         dest[0] = hasAlpha ? A : 255;

         dest[1] = R >> 22;

         dest[2] = G >> 22;

         dest[3] = B >> 22;

         break;

     case AV_PIX_FMT_RGB24:

         dest[0] = R >> 22;

         dest[1] = G >> 22;

         dest[2] = B >> 22;

         break;

     case AV_PIX_FMT_RGBA:

         dest[0] = R >> 22;

         dest[1] = G >> 22;

         dest[2] = B >> 22;

         dest[3] = hasAlpha ? A : 255;

         break;

     case AV_PIX_FMT_ABGR:

         dest[0] = hasAlpha ? A : 255;

         dest[1] = B >> 22;

         dest[2] = G >> 22;

         dest[3] = R >> 22;

         break;

     case AV_PIX_FMT_BGR24:

         dest[0] = B >> 22;

         dest[1] = G >> 22;

         dest[2] = R >> 22;

         break;

     case AV_PIX_FMT_BGRA:

         dest[0] = B >> 22;

         dest[1] = G >> 22;

         dest[2] = R >> 22;

         dest[3] = hasAlpha ? A : 255;

         break;

     /* Low-depth targets: one byte per pixel, quantized with dithering. */
     case AV_PIX_FMT_BGR4_BYTE:

     case AV_PIX_FMT_RGB4_BYTE:

     case AV_PIX_FMT_BGR8:

     case AV_PIX_FMT_RGB8:

     {

         /* quantized components: r/g/b are 3/3/2 bits wide for the 8-bit
          * targets and 1/2/1 bits wide for the 4-bit targets */
         int r,g,b;


         switch (c->dither) {

         default:

         case SWS_DITHER_AUTO:

         case SWS_DITHER_ED:

             /* Error diffusion: add 7/16 of the previous pixel's error and
              * 1/16, 5/16, 3/16 of the errors stored in c->dither_error at
              * i, i+1 and i+2. */
             R >>= 22;

             G >>= 22;

             B >>= 22;

             R += (7*err[0] + 1*c->dither_error[0][i] + 5*c->dither_error[0][i+1] + 3*c->dither_error[0][i+2])>>4;

             G += (7*err[1] + 1*c->dither_error[1][i] + 5*c->dither_error[1][i+1] + 3*c->dither_error[1][i+2])>>4;

             B += (7*err[2] + 1*c->dither_error[2][i] + 5*c->dither_error[2][i+1] + 3*c->dither_error[2][i+2])>>4;

             /* Slot i has been consumed; overwrite it with the error of the
              * previous pixel (err[] is only updated further down). */
             c->dither_error[0][i] = err[0];

             c->dither_error[1][i] = err[1];

             c->dither_error[2][i] = err[2];

             r = R >> (isrgb8 ? 5 : 7);

             g = G >> (isrgb8 ? 5 : 6);

             b = B >> (isrgb8 ? 6 : 7);

             r = av_clip(r, 0, isrgb8 ? 7 : 1);

             g = av_clip(g, 0, isrgb8 ? 7 : 3);

             b = av_clip(b, 0, isrgb8 ? 3 : 1);

             /* New error: dithered 8-bit value minus the value represented by
              * the quantized level (level * step size). */
             err[0] = R - r*(isrgb8 ? 36 : 255);

             err[1] = G - g*(isrgb8 ? 36 : 85);

             err[2] = B - b*(isrgb8 ? 85 : 255);

             break;

         case SWS_DITHER_A_DITHER:

             /* Position-dependent dither: the pattern value depends only on
              * (i, y); each channel uses a different horizontal offset. */
             if (isrgb8) {

   /* see http://pippin.gimp.org/a_dither/ for details/origin */

 #define A_DITHER(u,v)   (((((u)+((v)*236))*119)&0xff))

                 r = (((R >> 19) + A_DITHER(i,y)  -96)>>8);

                 g = (((G >> 19) + A_DITHER(i + 17,y) - 96)>>8);

                 b = (((B >> 20) + A_DITHER(i + 17*2,y) -96)>>8);

                 r = av_clip_uintp2(r, 3);

                 g = av_clip_uintp2(g, 3);

                 b = av_clip_uintp2(b, 2);

             } else {

                 r = (((R >> 21) + A_DITHER(i,y)-256)>>8);

                 g = (((G >> 19) + A_DITHER(i + 17,y)-256)>>8);

                 b = (((B >> 21) + A_DITHER(i + 17*2,y)-256)>>8);

                 r = av_clip_uintp2(r, 1);

                 g = av_clip_uintp2(g, 2);

                 b = av_clip_uintp2(b, 1);

             }

             break;

         case SWS_DITHER_X_DITHER:

             /* Same structure as the A_DITHER case with an XOR-based pattern. */
             if (isrgb8) {

   /* see http://pippin.gimp.org/a_dither/ for details/origin */

 #define X_DITHER(u,v)   (((((u)^((v)*237))*181)&0x1ff)/2)

                 r = (((R >> 19) + X_DITHER(i,y) - 96)>>8);

                 g = (((G >> 19) + X_DITHER(i + 17,y) - 96)>>8);

                 b = (((B >> 20) + X_DITHER(i + 17*2,y) - 96)>>8);

                 r = av_clip_uintp2(r, 3);

                 g = av_clip_uintp2(g, 3);

                 b = av_clip_uintp2(b, 2);

             } else {

                 r = (((R >> 21) + X_DITHER(i,y)-256)>>8);

                 g = (((G >> 19) + X_DITHER(i + 17,y)-256)>>8);

                 b = (((B >> 21) + X_DITHER(i + 17*2,y)-256)>>8);

                 r = av_clip_uintp2(r, 1);

                 g = av_clip_uintp2(g, 2);

                 b = av_clip_uintp2(b, 1);

             }


             break;

         }


         /* Pack the quantized components into a single byte. */
         if(target == AV_PIX_FMT_BGR4_BYTE) {

             dest[0] = r + 2*g + 8*b;

         } else if(target == AV_PIX_FMT_RGB4_BYTE) {

             dest[0] = b + 2*g + 8*r;

         } else if(target == AV_PIX_FMT_BGR8) {

             dest[0] = r + 8*g + 64*b;

         } else if(target == AV_PIX_FMT_RGB8) {

             dest[0] = b + 4*g + 32*r;

         } else

             av_assert2(0);

         break;}

     }

 }


 /**
  * Full-chroma packed RGB output using arbitrary-length vertical filters.
  *
  * For every output pixel the luma, chroma and (when hasAlpha is set) alpha
  * source lines are combined with lumFilter/chrFilter, and the result is
  * handed to yuv2rgb_write_full(). After the line has been written, the last
  * quantization error is stored in c->dither_error at the index following
  * the final pixel.
  */
 static av_always_inline void
 yuv2rgb_full_X_c_template(SwsContext *c, const int16_t *lumFilter,
                           const int16_t **lumSrc, int lumFilterSize,
                           const int16_t *chrFilter, const int16_t **chrUSrc,
                           const int16_t **chrVSrc, int chrFilterSize,
                           const int16_t **alpSrc, uint8_t *dest,
                           int dstW, int y, enum AVPixelFormat target, int hasAlpha)
 {
     int diffused[4] = {0};
     int alpha = 0; /* remains 0 when there is no alpha to filter */
     int step;
     int x;

     /* bytes per output pixel */
     switch (target) {
     case AV_PIX_FMT_BGR4_BYTE:
     case AV_PIX_FMT_RGB4_BYTE:
     case AV_PIX_FMT_BGR8:
     case AV_PIX_FMT_RGB8:
         step = 1;
         break;
     case AV_PIX_FMT_RGB24:
     case AV_PIX_FMT_BGR24:
         step = 3;
         break;
     default:
         step = 4;
         break;
     }

     for (x = 0; x < dstW; x++) {
         int luma = 1 << 9;
         int cb   = (1 << 9) - (128 << 19);
         int cr   = (1 << 9) - (128 << 19);
         int tap;

         for (tap = 0; tap < lumFilterSize; tap++)
             luma += lumSrc[tap][x] * lumFilter[tap];

         for (tap = 0; tap < chrFilterSize; tap++) {
             cb += chrUSrc[tap][x] * chrFilter[tap];
             cr += chrVSrc[tap][x] * chrFilter[tap];
         }

         luma >>= 10;
         cb   >>= 10;
         cr   >>= 10;

         if (hasAlpha) {
             alpha = 1 << 18;
             for (tap = 0; tap < lumFilterSize; tap++)
                 alpha += alpSrc[tap][x] * lumFilter[tap];
             alpha >>= 19;
             if (alpha & 0x100)
                 alpha = av_clip_uint8(alpha);
         }

         yuv2rgb_write_full(c, dest, x, luma, alpha, cb, cr, y, target,
                            hasAlpha, diffused);
         dest += step;
     }

     /* x is now one past the last pixel written */
     c->dither_error[0][x] = diffused[0];
     c->dither_error[1][x] = diffused[1];
     c->dither_error[2][x] = diffused[2];
 }


 /**
  * Full-chroma packed RGB output blending two source lines.
  *
  * Line 1 of each plane is weighted with yalpha / uvalpha and line 0 with
  * 4096 minus that weight. The blended sample is handed to
  * yuv2rgb_write_full(); afterwards the last quantization error is stored in
  * c->dither_error at the index following the final pixel.
  */
 static av_always_inline void
 yuv2rgb_full_2_c_template(SwsContext *c, const int16_t *buf[2],
                      const int16_t *ubuf[2], const int16_t *vbuf[2],
                      const int16_t *abuf[2], uint8_t *dest, int dstW,
                      int yalpha, int uvalpha, int y,
                      enum AVPixelFormat target, int hasAlpha)
 {
     const int16_t *luma0  = buf[0];
     const int16_t *luma1  = buf[1];
     const int16_t *cb0    = ubuf[0];
     const int16_t *cb1    = ubuf[1];
     const int16_t *cr0    = vbuf[0];
     const int16_t *cr1    = vbuf[1];
     const int16_t *alpha0 = hasAlpha ? abuf[0] : NULL;
     const int16_t *alpha1 = hasAlpha ? abuf[1] : NULL;
     int  yalpha1 = 4096 - yalpha;
     int uvalpha1 = 4096 - uvalpha;
     int diffused[4] = {0};
     int alpha = 0; /* init to silence warning */
     int step;
     int x;

     av_assert2(yalpha  <= 4096U);
     av_assert2(uvalpha <= 4096U);

     /* bytes per output pixel */
     switch (target) {
     case AV_PIX_FMT_BGR4_BYTE:
     case AV_PIX_FMT_RGB4_BYTE:
     case AV_PIX_FMT_BGR8:
     case AV_PIX_FMT_RGB8:
         step = 1;
         break;
     case AV_PIX_FMT_RGB24:
     case AV_PIX_FMT_BGR24:
         step = 3;
         break;
     default:
         step = 4;
         break;
     }

     for (x = 0; x < dstW; x++) {
         int luma = (luma0[x] * yalpha1 + luma1[x] * yalpha) >> 10; /* FIXME rounding */
         int cb   = (cb0[x] * uvalpha1 + cb1[x] * uvalpha - (128 << 19)) >> 10;
         int cr   = (cr0[x] * uvalpha1 + cr1[x] * uvalpha - (128 << 19)) >> 10;

         if (hasAlpha) {
             alpha = (alpha0[x] * yalpha1 + alpha1[x] * yalpha + (1 << 18)) >> 19;
             if (alpha & 0x100)
                 alpha = av_clip_uint8(alpha);
         }

         yuv2rgb_write_full(c, dest, x, luma, alpha, cb, cr, y, target,
                            hasAlpha, diffused);
         dest += step;
     }

     /* x is now one past the last pixel written */
     c->dither_error[0][x] = diffused[0];
     c->dither_error[1][x] = diffused[1];
     c->dither_error[2][x] = diffused[2];
 }


 /**
  * Full-chroma packed RGB output from a single luma line.
  *
  * When uvalpha is below 2048 only the first chroma line is used; otherwise
  * the two chroma lines are added together. Each sample is handed to
  * yuv2rgb_write_full(); afterwards the last quantization error is stored in
  * c->dither_error at the index following the final pixel.
  */
 static av_always_inline void
 yuv2rgb_full_1_c_template(SwsContext *c, const int16_t *buf0,
                      const int16_t *ubuf[2], const int16_t *vbuf[2],
                      const int16_t *abuf0, uint8_t *dest, int dstW,
                      int uvalpha, int y, enum AVPixelFormat target,
                      int hasAlpha)
 {
     const int16_t *cb0 = ubuf[0];
     const int16_t *cr0 = vbuf[0];
     int diffused[4] = {0};
     int alpha = 0; /* init to silence warning */
     int step;
     int x;

     /* bytes per output pixel */
     switch (target) {
     case AV_PIX_FMT_BGR4_BYTE:
     case AV_PIX_FMT_RGB4_BYTE:
     case AV_PIX_FMT_BGR8:
     case AV_PIX_FMT_RGB8:
         step = 1;
         break;
     case AV_PIX_FMT_RGB24:
     case AV_PIX_FMT_BGR24:
         step = 3;
         break;
     default:
         step = 4;
         break;
     }

     if (uvalpha >= 2048) {
         /* use the sum of both chroma lines */
         const int16_t *cb1 = ubuf[1];
         const int16_t *cr1 = vbuf[1];

         for (x = 0; x < dstW; x++) {
             int luma = buf0[x] << 2;
             int cb   = (cb0[x] + cb1[x] - (128 << 8)) << 1;
             int cr   = (cr0[x] + cr1[x] - (128 << 8)) << 1;

             if (hasAlpha) {
                 alpha = (abuf0[x] + 64) >> 7;
                 if (alpha & 0x100)
                     alpha = av_clip_uint8(alpha);
             }

             yuv2rgb_write_full(c, dest, x, luma, alpha, cb, cr, y, target,
                                hasAlpha, diffused);
             dest += step;
         }
     } else {
         /* first chroma line only */
         for (x = 0; x < dstW; x++) {
             int luma = buf0[x] << 2;
             int cb   = (cb0[x] - (128 << 7)) * 4;
             int cr   = (cr0[x] - (128 << 7)) * 4;

             if (hasAlpha) {
                 alpha = (abuf0[x] + 64) >> 7;
                 if (alpha & 0x100)
                     alpha = av_clip_uint8(alpha);
             }

             yuv2rgb_write_full(c, dest, x, luma, alpha, cb, cr, y, target,
                                hasAlpha, diffused);
             dest += step;
         }
     }

     /* x is now one past the last pixel written */
     c->dither_error[0][x] = diffused[0];
     c->dither_error[1][x] = diffused[1];
     c->dither_error[2][x] = diffused[2];
 }


 /*
  * Instantiate the wrapper functions around the yuv2rgb_full_*_c_template()
  * functions for every supported output format.
  *
  * With CONFIG_SMALL one variant per 32-bit format is generated and the
  * hasAlpha argument is the expression CONFIG_SWSCALE_ALPHA && c->needAlpha.
  * Otherwise variants with hasAlpha fixed to 1 (only when
  * CONFIG_SWSCALE_ALPHA is set) and to 0 (the "x" names) are generated for
  * the same pixel formats.
  */
 #if CONFIG_SMALL

 YUV2RGBWRAPPER(yuv2, rgb_full, bgra32_full, AV_PIX_FMT_BGRA,  CONFIG_SWSCALE_ALPHA && c->needAlpha)

 YUV2RGBWRAPPER(yuv2, rgb_full, abgr32_full, AV_PIX_FMT_ABGR,  CONFIG_SWSCALE_ALPHA && c->needAlpha)

 YUV2RGBWRAPPER(yuv2, rgb_full, rgba32_full, AV_PIX_FMT_RGBA,  CONFIG_SWSCALE_ALPHA && c->needAlpha)

 YUV2RGBWRAPPER(yuv2, rgb_full, argb32_full, AV_PIX_FMT_ARGB,  CONFIG_SWSCALE_ALPHA && c->needAlpha)

 #else

 #if CONFIG_SWSCALE_ALPHA

 YUV2RGBWRAPPER(yuv2, rgb_full, bgra32_full, AV_PIX_FMT_BGRA,  1)

 YUV2RGBWRAPPER(yuv2, rgb_full, abgr32_full, AV_PIX_FMT_ABGR,  1)

 YUV2RGBWRAPPER(yuv2, rgb_full, rgba32_full, AV_PIX_FMT_RGBA,  1)

 YUV2RGBWRAPPER(yuv2, rgb_full, argb32_full, AV_PIX_FMT_ARGB,  1)

 #endif

 YUV2RGBWRAPPER(yuv2, rgb_full, bgrx32_full, AV_PIX_FMT_BGRA,  0)

 YUV2RGBWRAPPER(yuv2, rgb_full, xbgr32_full, AV_PIX_FMT_ABGR,  0)

 YUV2RGBWRAPPER(yuv2, rgb_full, rgbx32_full, AV_PIX_FMT_RGBA,  0)

 YUV2RGBWRAPPER(yuv2, rgb_full, xrgb32_full, AV_PIX_FMT_ARGB,  0)

 #endif

 /* 24-bit formats: no alpha byte. */
 YUV2RGBWRAPPER(yuv2, rgb_full, bgr24_full,  AV_PIX_FMT_BGR24, 0)

 YUV2RGBWRAPPER(yuv2, rgb_full, rgb24_full,  AV_PIX_FMT_RGB24, 0)


 /* One-byte-per-pixel formats. */
 YUV2RGBWRAPPER(yuv2, rgb_full, bgr4_byte_full,  AV_PIX_FMT_BGR4_BYTE, 0)

 YUV2RGBWRAPPER(yuv2, rgb_full, rgb4_byte_full,  AV_PIX_FMT_RGB4_BYTE, 0)

 YUV2RGBWRAPPER(yuv2, rgb_full, bgr8_full,   AV_PIX_FMT_BGR8,  0)

 YUV2RGBWRAPPER(yuv2, rgb_full, rgb8_full,   AV_PIX_FMT_RGB8,  0)


 /**
  * Vertically filter YUV(A) input and write planar G, B, R (and optionally A)
  * output, one plane per dest[] entry in that order.
  *
  * The output shift is derived from the depth of the destination format's
  * first component. A shift of 22 selects the byte-wide store path; every
  * other value stores 16-bit words, which are byte-swapped afterwards when
  * the destination endianness differs from the host's.
  */
 static void
 yuv2gbrp_full_X_c(SwsContext *c, const int16_t *lumFilter,
                   const int16_t **lumSrc, int lumFilterSize,
                   const int16_t *chrFilter, const int16_t **chrUSrc,
                   const int16_t **chrVSrc, int chrFilterSize,
                   const int16_t **alpSrc, uint8_t **dest,
                   int dstW, int y)
 {
     const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(c->dstFormat);
     int hasAlpha = (desc->flags & AV_PIX_FMT_FLAG_ALPHA) && alpSrc;
     int shift    = 22 + 8 - desc->comp[0].depth;
     uint16_t **dest16 = (uint16_t**)dest;
     int alpha = 0; /* init to silence warning */
     int x;

     for (x = 0; x < dstW; x++) {
         int luma = 1 << 9;
         int cb   = (1 << 9) - (128 << 19);
         int cr   = (1 << 9) - (128 << 19);
         int R, G, B;
         int tap;

         for (tap = 0; tap < lumFilterSize; tap++)
             luma += lumSrc[tap][x] * lumFilter[tap];

         for (tap = 0; tap < chrFilterSize; tap++) {
             cb += chrUSrc[tap][x] * chrFilter[tap];
             cr += chrVSrc[tap][x] * chrFilter[tap];
         }

         luma >>= 10;
         cb   >>= 10;
         cr   >>= 10;

         if (hasAlpha) {
             alpha = 1 << 18;
             for (tap = 0; tap < lumFilterSize; tap++)
                 alpha += alpSrc[tap][x] * lumFilter[tap];

             if (alpha & 0xF8000000)
                 alpha = av_clip_uintp2(alpha, 27);
         }

         luma -= c->yuv2rgb_y_offset;
         luma *= c->yuv2rgb_y_coeff;
         luma += 1 << (shift - 1); /* rounding term for the final shift */
         R = luma + cr * c->yuv2rgb_v2r_coeff;
         G = luma + cr * c->yuv2rgb_v2g_coeff + cb * c->yuv2rgb_u2g_coeff;
         B = luma +                             cb * c->yuv2rgb_u2b_coeff;

         if ((R | G | B) & 0xC0000000) {
             R = av_clip_uintp2(R, 30);
             G = av_clip_uintp2(G, 30);
             B = av_clip_uintp2(B, 30);
         }

         if (shift == 22) {
             /* byte-wide planes */
             dest[0][x] = G >> 22;
             dest[1][x] = B >> 22;
             dest[2][x] = R >> 22;
             if (hasAlpha)
                 dest[3][x] = alpha >> 19;
         } else {
             /* 16-bit planes, host byte order for now */
             dest16[0][x] = G >> shift;
             dest16[1][x] = B >> shift;
             dest16[2][x] = R >> shift;
             if (hasAlpha)
                 dest16[3][x] = alpha >> (shift - 3);
         }
     }

     /* Convert the 16-bit output to the destination byte order if needed. */
     if (shift != 22 && (!isBE(c->dstFormat)) != (!HAVE_BIGENDIAN)) {
         const int planes = hasAlpha ? 4 : 3;
         int p;

         for (x = 0; x < dstW; x++)
             for (p = 0; p < planes; p++)
                 dest16[p][x] = av_bswap16(dest16[p][x]);
     }
 }


 /**
  * Vertically filter YUV(A) input held in 32-bit intermediates and write
  * 16-bit planar G, B, R (and optionally A) output.
  *
  * The int16_t source pointers are reinterpreted as int32_t line pointers.
  * Output planes are taken from dest[0..3] in the order G, B, R, A and are
  * byte-swapped in a second pass when the destination endianness differs
  * from the host's.
  *
  * @param c             context providing dstFormat and the yuv2rgb_* coefficients
  * @param lumFilter     vertical filter taps for luma and alpha
  * @param lumSrcx       luma source lines (int32_t samples)
  * @param lumFilterSize number of luma/alpha taps
  * @param chrFilter     vertical filter taps for chroma
  * @param chrUSrcx      U source lines (int32_t samples)
  * @param chrVSrcx      V source lines (int32_t samples)
  * @param chrFilterSize number of chroma taps
  * @param alpSrcx       alpha source lines (int32_t samples); alpha is only
  *                      written when this is non-NULL and the destination
  *                      format has the alpha flag
  * @param dest          output plane pointers
  * @param dstW          number of pixels to produce
  * @param y             unused here
  */
 static void
 yuv2gbrp16_full_X_c(SwsContext *c, const int16_t *lumFilter,
                     const int16_t **lumSrcx, int lumFilterSize,
                     const int16_t *chrFilter, const int16_t **chrUSrcx,
                     const int16_t **chrVSrcx, int chrFilterSize,
                     const int16_t **alpSrcx, uint8_t **dest,
                     int dstW, int y)
 {
     const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(c->dstFormat);
     int i;
     int hasAlpha = (desc->flags & AV_PIX_FMT_FLAG_ALPHA) && alpSrcx;
     uint16_t **dest16 = (uint16_t**)dest;
     const int32_t **lumSrc  = (const int32_t**)lumSrcx;
     const int32_t **chrUSrc = (const int32_t**)chrUSrcx;
     const int32_t **chrVSrc = (const int32_t**)chrVSrcx;
     const int32_t **alpSrc  = (const int32_t**)alpSrcx;

     for (i = 0; i < dstW; i++) {
         int j;
         /* The accumulators start with a negative bias so that the sums stay
          * in int range; the bias is undone after the shift. */
         int Y = -0x40000000;
         int U = -(128 << 23);
         int V = -(128 << 23);
         int R, G, B;
         int A = 0; /* only meaningful when hasAlpha is set */

         /* The products are formed in unsigned arithmetic so that
          * intermediate wrap-around is well defined. */
         for (j = 0; j < lumFilterSize; j++)
             Y += lumSrc[j][i] * (unsigned)lumFilter[j];

         for (j = 0; j < chrFilterSize; j++) {
             U += chrUSrc[j][i] * (unsigned)chrFilter[j];
             V += chrVSrc[j][i] * (unsigned)chrFilter[j];
         }

         Y >>= 14;
         Y += 0x10000;
         U >>= 14;
         V >>= 14;

         if (hasAlpha) {
             A = -0x40000000;

             /* Same unsigned multiplication as for Y/U/V above: a signed
              * int32 * int product could overflow, which is undefined. */
             for (j = 0; j < lumFilterSize; j++)
                 A += alpSrc[j][i] * (unsigned)lumFilter[j];

             A >>= 1;
             A += 0x20002000;
         }

         Y -= c->yuv2rgb_y_offset;
         Y *= c->yuv2rgb_y_coeff;
         Y += 1 << 13; /* rounding term for the >> 14 below */
         R = V * c->yuv2rgb_v2r_coeff;
         G = V * c->yuv2rgb_v2g_coeff + U * c->yuv2rgb_u2g_coeff;
         B =                            U * c->yuv2rgb_u2b_coeff;

         R = av_clip_uintp2(Y + R, 30);
         G = av_clip_uintp2(Y + G, 30);
         B = av_clip_uintp2(Y + B, 30);

         dest16[0][i] = G >> 14;
         dest16[1][i] = B >> 14;
         dest16[2][i] = R >> 14;
         if (hasAlpha)
             dest16[3][i] = av_clip_uintp2(A, 30) >> 14;
     }

     /* Convert to the destination byte order if it differs from the host's. */
     if ((!isBE(c->dstFormat)) != (!HAVE_BIGENDIAN)) {
         for (i = 0; i < dstW; i++) {
             dest16[0][i] = av_bswap16(dest16[0][i]);
             dest16[1][i] = av_bswap16(dest16[1][i]);
             dest16[2][i] = av_bswap16(dest16[2][i]);
             if (hasAlpha)
                 dest16[3][i] = av_bswap16(dest16[3][i]);
         }
     }
 }


 /**
  * Write one line of interleaved 8-bit gray + alpha from a single luma line.
  *
  * Luma and alpha samples are rounded and shifted right by 7. When abuf0 is
  * NULL the alpha byte is set to 255. The chroma arguments, uvalpha and y
  * are not used.
  */
 static void
 yuv2ya8_1_c(SwsContext *c, const int16_t *buf0,
             const int16_t *ubuf[2], const int16_t *vbuf[2],
             const int16_t *abuf0, uint8_t *dest, int dstW,
             int uvalpha, int y)
 {
     const int hasAlpha = abuf0 ? 1 : 0;
     uint8_t *out = dest;
     int x;

     for (x = 0; x < dstW; x++, out += 2) {
         int gray  = av_clip_uint8((buf0[x] + 64) >> 7);
         int alpha = 255;

         if (hasAlpha) {
             alpha = (abuf0[x] + 64) >> 7;
             if (alpha & 0x100)
                 alpha = av_clip_uint8(alpha);
         }

         out[0] = gray;
         out[1] = alpha;
     }
 }


 /**
  * Write one line of interleaved 8-bit gray + alpha by blending two source
  * lines.
  *
  * Line 1 is weighted with yalpha and line 0 with 4096 - yalpha. Alpha is
  * only blended when abuf and both of its line pointers are non-NULL;
  * otherwise the alpha byte is set to 255. The chroma arguments, uvalpha and
  * y are not used.
  */
 static void
 yuv2ya8_2_c(SwsContext *c, const int16_t *buf[2],
             const int16_t *ubuf[2], const int16_t *vbuf[2],
             const int16_t *abuf[2], uint8_t *dest, int dstW,
             int yalpha, int uvalpha, int y)
 {
     const int hasAlpha = abuf && abuf[0] && abuf[1];
     const int16_t *luma0  = buf[0];
     const int16_t *luma1  = buf[1];
     const int16_t *alpha0 = hasAlpha ? abuf[0] : NULL;
     const int16_t *alpha1 = hasAlpha ? abuf[1] : NULL;
     const int yalpha1 = 4096 - yalpha;
     uint8_t *out = dest;
     int x;

     av_assert2(yalpha  <= 4096U);

     for (x = 0; x < dstW; x++, out += 2) {
         int gray  = av_clip_uint8((luma0[x] * yalpha1 + luma1[x] * yalpha) >> 19);
         int alpha = 255;

         if (hasAlpha)
             alpha = av_clip_uint8((alpha0[x] * yalpha1 + alpha1[x] * yalpha) >> 19);

         out[0] = gray;
         out[1] = alpha;
     }
 }


 /**
  * Write one line of interleaved 8-bit gray + alpha using an
  * arbitrary-length vertical filter.
  *
  * Luma and alpha are both filtered with lumFilter, rounded and shifted
  * right by 19. When alpSrc is NULL the alpha byte is set to 255. The chroma
  * arguments and y are not used.
  */
 static void
 yuv2ya8_X_c(SwsContext *c, const int16_t *lumFilter,
             const int16_t **lumSrc, int lumFilterSize,
             const int16_t *chrFilter, const int16_t **chrUSrc,
             const int16_t **chrVSrc, int chrFilterSize,
             const int16_t **alpSrc, uint8_t *dest, int dstW, int y)
 {
     const int hasAlpha = alpSrc ? 1 : 0;
     uint8_t *out = dest;
     int x;

     for (x = 0; x < dstW; x++, out += 2) {
         int gray  = 1 << 18; /* rounding term for the >> 19 */
         int alpha = 255;
         int tap;

         for (tap = 0; tap < lumFilterSize; tap++)
             gray += lumSrc[tap][x] * lumFilter[tap];

         gray >>= 19;
         if (gray & 0x100)
             gray = av_clip_uint8(gray);

         if (hasAlpha) {
             alpha = 1 << 18;
             for (tap = 0; tap < lumFilterSize; tap++)
                 alpha += alpSrc[tap][x] * lumFilter[tap];

             alpha >>= 19;
             if (alpha & 0x100)
                 alpha = av_clip_uint8(alpha);
         }

         out[0] = gray;
         out[1] = alpha;
     }
 }


 /**
  * Write one line of packed little-endian 16-bit A, Y, U, V (8 bytes per
  * pixel, in that order) using arbitrary-length vertical filters.
  *
  * The int16_t source pointers are reinterpreted as int32_t line pointers.
  * When _alpSrc is NULL the alpha word is set to 65535. y is not used.
  */
 static void
 yuv2ayuv64le_X_c(SwsContext *c, const int16_t *lumFilter,
                  const int16_t **_lumSrc, int lumFilterSize,
                  const int16_t *chrFilter, const int16_t **_chrUSrc,
                  const int16_t **_chrVSrc, int chrFilterSize,
                  const int16_t **_alpSrc, uint8_t *dest, int dstW, int y)
 {
     const int32_t **lumSrc  = (const int32_t **) _lumSrc;
     const int32_t **chrUSrc = (const int32_t **) _chrUSrc;
     const int32_t **chrVSrc = (const int32_t **) _chrVSrc;
     const int32_t **alpSrc  = (const int32_t **) _alpSrc;
     const int hasAlpha = alpSrc ? 1 : 0;
     int x;

     for (x = 0; x < dstW; x++) {
         /* rounding term plus a negative bias that is undone by the 0x8000
          * added after the shift */
         int luma  = (1 << 14) - 0x40000000;
         int cb    = (1 << 14) - 0x40000000;
         int cr    = (1 << 14) - 0x40000000;
         int alpha = (1 << 14) - 0x40000000;
         uint8_t *px = dest + 8 * x;
         int tap;

         for (tap = 0; tap < lumFilterSize; tap++)
             luma += lumSrc[tap][x] * (unsigned)lumFilter[tap];

         for (tap = 0; tap < chrFilterSize; tap++) {
             cb += chrUSrc[tap][x] * (unsigned)chrFilter[tap];
             cr += chrVSrc[tap][x] * (unsigned)chrFilter[tap];
         }

         if (hasAlpha) {
             for (tap = 0; tap < lumFilterSize; tap++)
                 alpha += alpSrc[tap][x] * (unsigned)lumFilter[tap];
         }

         luma  = 0x8000 + av_clip_int16(luma  >> 15);
         cb    = 0x8000 + av_clip_int16(cb    >> 15);
         cr    = 0x8000 + av_clip_int16(cr    >> 15);
         alpha = 0x8000 + av_clip_int16(alpha >> 15);

         AV_WL16(px,     hasAlpha ? alpha : 65535);
         AV_WL16(px + 2, luma);
         AV_WL16(px + 4, cb);
         AV_WL16(px + 6, cr);
     }
 }


 av_cold void ff_sws_init_output_funcs(SwsContext *c,

                                       yuv2planar1_fn *yuv2plane1,

                                       yuv2planarX_fn *yuv2planeX,

                                       yuv2interleavedX_fn *yuv2nv12cX,

                                       yuv2packed1_fn *yuv2packed1,

                                       yuv2packed2_fn *yuv2packed2,

                                       yuv2packedX_fn *yuv2packedX,

                                       yuv2anyX_fn *yuv2anyX)

 {

     enum AVPixelFormat dstFormat = c->dstFormat;

     const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(dstFormat);


     if (dstFormat == AV_PIX_FMT_P010LE || dstFormat == AV_PIX_FMT_P010BE) {

         *yuv2plane1 = isBE(dstFormat) ? yuv2p010l1_BE_c : yuv2p010l1_LE_c;

         *yuv2planeX = isBE(dstFormat) ? yuv2p010lX_BE_c : yuv2p010lX_LE_c;

         *yuv2nv12cX = yuv2p010cX_c;

     } else if (is16BPS(dstFormat)) {

         *yuv2planeX = isBE(dstFormat) ? yuv2planeX_16BE_c  : yuv2planeX_16LE_c;

         *yuv2plane1 = isBE(dstFormat) ? yuv2plane1_16BE_c  : yuv2plane1_16LE_c;

         if (dstFormat == AV_PIX_FMT_P016LE || dstFormat == AV_PIX_FMT_P016BE) {

           *yuv2nv12cX = yuv2p016cX_c;

         }

     } else if (isNBPS(dstFormat)) {

         if (desc->comp[0].depth == 9) {

             *yuv2planeX = isBE(dstFormat) ? yuv2planeX_9BE_c  : yuv2planeX_9LE_c;

             *yuv2plane1 = isBE(dstFormat) ? yuv2plane1_9BE_c  : yuv2plane1_9LE_c;

         } else if (desc->comp[0].depth == 10) {

             *yuv2planeX = isBE(dstFormat) ? yuv2planeX_10BE_c  : yuv2planeX_10LE_c;

             *yuv2plane1 = isBE(dstFormat) ? yuv2plane1_10BE_c  : yuv2plane1_10LE_c;

         } else if (desc->comp[0].depth == 12) {

             *yuv2planeX = isBE(dstFormat) ? yuv2planeX_12BE_c  : yuv2planeX_12LE_c;

             *yuv2plane1 = isBE(dstFormat) ? yuv2plane1_12BE_c  : yuv2plane1_12LE_c;

         } else if (desc->comp[0].depth == 14) {

             *yuv2planeX = isBE(dstFormat) ? yuv2planeX_14BE_c  : yuv2planeX_14LE_c;

             *yuv2plane1 = isBE(dstFormat) ? yuv2plane1_14BE_c  : yuv2plane1_14LE_c;

         } else

             av_assert0(0);

     } else {

         *yuv2plane1 = yuv2plane1_8_c;

         *yuv2planeX = yuv2planeX_8_c;

         if (dstFormat == AV_PIX_FMT_NV12 || dstFormat == AV_PIX_FMT_NV21)

             *yuv2nv12cX = yuv2nv12cX_c;

     }


     if(c->flags & SWS_FULL_CHR_H_INT) {

         switch (dstFormat) {

             case AV_PIX_FMT_RGBA:

 #if CONFIG_SMALL

                 *yuv2packedX = yuv2rgba32_full_X_c;

                 *yuv2packed2 = yuv2rgba32_full_2_c;

                 *yuv2packed1 = yuv2rgba32_full_1_c;

 #else

 #if CONFIG_SWSCALE_ALPHA

                 if (c->needAlpha) {

                     *yuv2packedX = yuv2rgba32_full_X_c;

                     *yuv2packed2 = yuv2rgba32_full_2_c;

                     *yuv2packed1 = yuv2rgba32_full_1_c;

                 } else

 #endif /* CONFIG_SWSCALE_ALPHA */

                 {

                     *yuv2packedX = yuv2rgbx32_full_X_c;

                     *yuv2packed2 = yuv2rgbx32_full_2_c;

                     *yuv2packed1 = yuv2rgbx32_full_1_c;

                 }

 #endif /* !CONFIG_SMALL */

                 break;

             case AV_PIX_FMT_ARGB:

 #if CONFIG_SMALL

                 *yuv2packedX = yuv2argb32_full_X_c;

                 *yuv2packed2 = yuv2argb32_full_2_c;

                 *yuv2packed1 = yuv2argb32_full_1_c;

 #else

 #if CONFIG_SWSCALE_ALPHA

                 if (c->needAlpha) {

                     *yuv2packedX = yuv2argb32_full_X_c;

                     *yuv2packed2 = yuv2argb32_full_2_c;

                     *yuv2packed1 = yuv2argb32_full_1_c;

                 } else

 #endif /* CONFIG_SWSCALE_ALPHA */

                 {

                     *yuv2packedX = yuv2xrgb32_full_X_c;

                     *yuv2packed2 = yuv2xrgb32_full_2_c;

                     *yuv2packed1 = yuv2xrgb32_full_1_c;

                 }

 #endif /* !CONFIG_SMALL */

                 break;

             case AV_PIX_FMT_BGRA:

 #if CONFIG_SMALL

                 *yuv2packedX = yuv2bgra32_full_X_c;

                 *yuv2packed2 = yuv2bgra32_full_2_c;

                 *yuv2packed1 = yuv2bgra32_full_1_c;

 #else

 #if CONFIG_SWSCALE_ALPHA

                 if (c->needAlpha) {

                     *yuv2packedX = yuv2bgra32_full_X_c;

                     *yuv2packed2 = yuv2bgra32_full_2_c;

                     *yuv2packed1 = yuv2bgra32_full_1_c;

                 } else

 #endif /* CONFIG_SWSCALE_ALPHA */

                 {

                     *yuv2packedX = yuv2bgrx32_full_X_c;

                     *yuv2packed2 = yuv2bgrx32_full_2_c;

                     *yuv2packed1 = yuv2bgrx32_full_1_c;

                 }

 #endif /* !CONFIG_SMALL */

                 break;

             case AV_PIX_FMT_ABGR:

 #if CONFIG_SMALL

                 *yuv2packedX = yuv2abgr32_full_X_c;

                 *yuv2packed2 = yuv2abgr32_full_2_c;

                 *yuv2packed1 = yuv2abgr32_full_1_c;

 #else

 #if CONFIG_SWSCALE_ALPHA

                 if (c->needAlpha) {

                     *yuv2packedX = yuv2abgr32_full_X_c;

                     *yuv2packed2 = yuv2abgr32_full_2_c;

                     *yuv2packed1 = yuv2abgr32_full_1_c;

                 } else

 #endif /* CONFIG_SWSCALE_ALPHA */

                 {

                     *yuv2packedX = yuv2xbgr32_full_X_c;

                     *yuv2packed2 = yuv2xbgr32_full_2_c;

                     *yuv2packed1 = yuv2xbgr32_full_1_c;

                 }

 #endif /* !CONFIG_SMALL */

                 break;

         case AV_PIX_FMT_RGBA64LE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packedX = yuv2rgba64le_full_X_c;

                 *yuv2packed2 = yuv2rgba64le_full_2_c;

                 *yuv2packed1 = yuv2rgba64le_full_1_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packedX = yuv2rgbx64le_full_X_c;

                 *yuv2packed2 = yuv2rgbx64le_full_2_c;

                 *yuv2packed1 = yuv2rgbx64le_full_1_c;

             }

             break;

         case AV_PIX_FMT_RGBA64BE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packedX = yuv2rgba64be_full_X_c;

                 *yuv2packed2 = yuv2rgba64be_full_2_c;

                 *yuv2packed1 = yuv2rgba64be_full_1_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packedX = yuv2rgbx64be_full_X_c;

                 *yuv2packed2 = yuv2rgbx64be_full_2_c;

                 *yuv2packed1 = yuv2rgbx64be_full_1_c;

             }

             break;

         case AV_PIX_FMT_BGRA64LE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packedX = yuv2bgra64le_full_X_c;

                 *yuv2packed2 = yuv2bgra64le_full_2_c;

                 *yuv2packed1 = yuv2bgra64le_full_1_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packedX = yuv2bgrx64le_full_X_c;

                 *yuv2packed2 = yuv2bgrx64le_full_2_c;

                 *yuv2packed1 = yuv2bgrx64le_full_1_c;

             }

             break;

         case AV_PIX_FMT_BGRA64BE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packedX = yuv2bgra64be_full_X_c;

                 *yuv2packed2 = yuv2bgra64be_full_2_c;

                 *yuv2packed1 = yuv2bgra64be_full_1_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packedX = yuv2bgrx64be_full_X_c;

                 *yuv2packed2 = yuv2bgrx64be_full_2_c;

                 *yuv2packed1 = yuv2bgrx64be_full_1_c;

             }

             break;


         case AV_PIX_FMT_RGB24:

             *yuv2packedX = yuv2rgb24_full_X_c;

             *yuv2packed2 = yuv2rgb24_full_2_c;

             *yuv2packed1 = yuv2rgb24_full_1_c;

             break;

         case AV_PIX_FMT_BGR24:

             *yuv2packedX = yuv2bgr24_full_X_c;

             *yuv2packed2 = yuv2bgr24_full_2_c;

             *yuv2packed1 = yuv2bgr24_full_1_c;

             break;

         case AV_PIX_FMT_RGB48LE:

             *yuv2packedX = yuv2rgb48le_full_X_c;

             *yuv2packed2 = yuv2rgb48le_full_2_c;

             *yuv2packed1 = yuv2rgb48le_full_1_c;

             break;

         case AV_PIX_FMT_BGR48LE:

             *yuv2packedX = yuv2bgr48le_full_X_c;

             *yuv2packed2 = yuv2bgr48le_full_2_c;

             *yuv2packed1 = yuv2bgr48le_full_1_c;

             break;

         case AV_PIX_FMT_RGB48BE:

             *yuv2packedX = yuv2rgb48be_full_X_c;

             *yuv2packed2 = yuv2rgb48be_full_2_c;

             *yuv2packed1 = yuv2rgb48be_full_1_c;

             break;

         case AV_PIX_FMT_BGR48BE:

             *yuv2packedX = yuv2bgr48be_full_X_c;

             *yuv2packed2 = yuv2bgr48be_full_2_c;

             *yuv2packed1 = yuv2bgr48be_full_1_c;

             break;

         case AV_PIX_FMT_BGR4_BYTE:

             *yuv2packedX = yuv2bgr4_byte_full_X_c;

             *yuv2packed2 = yuv2bgr4_byte_full_2_c;

             *yuv2packed1 = yuv2bgr4_byte_full_1_c;

             break;

         case AV_PIX_FMT_RGB4_BYTE:

             *yuv2packedX = yuv2rgb4_byte_full_X_c;

             *yuv2packed2 = yuv2rgb4_byte_full_2_c;

             *yuv2packed1 = yuv2rgb4_byte_full_1_c;

             break;

         case AV_PIX_FMT_BGR8:

             *yuv2packedX = yuv2bgr8_full_X_c;

             *yuv2packed2 = yuv2bgr8_full_2_c;

             *yuv2packed1 = yuv2bgr8_full_1_c;

             break;

         case AV_PIX_FMT_RGB8:

             *yuv2packedX = yuv2rgb8_full_X_c;

             *yuv2packed2 = yuv2rgb8_full_2_c;

             *yuv2packed1 = yuv2rgb8_full_1_c;

             break;

         case AV_PIX_FMT_GBRP:

         case AV_PIX_FMT_GBRP9BE:

         case AV_PIX_FMT_GBRP9LE:

         case AV_PIX_FMT_GBRP10BE:

         case AV_PIX_FMT_GBRP10LE:

         case AV_PIX_FMT_GBRP12BE:

         case AV_PIX_FMT_GBRP12LE:

         case AV_PIX_FMT_GBRP14BE:

         case AV_PIX_FMT_GBRP14LE:

         case AV_PIX_FMT_GBRAP:

         case AV_PIX_FMT_GBRAP10BE:

         case AV_PIX_FMT_GBRAP10LE:

         case AV_PIX_FMT_GBRAP12BE:

         case AV_PIX_FMT_GBRAP12LE:

             *yuv2anyX = yuv2gbrp_full_X_c;

             break;

         case AV_PIX_FMT_GBRP16BE:

         case AV_PIX_FMT_GBRP16LE:

         case AV_PIX_FMT_GBRAP16BE:

         case AV_PIX_FMT_GBRAP16LE:

             *yuv2anyX = yuv2gbrp16_full_X_c;

             break;

         }

         if (!*yuv2packedX && !*yuv2anyX)

             goto YUV_PACKED;

     } else {

         YUV_PACKED:

         switch (dstFormat) {

         case AV_PIX_FMT_RGBA64LE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packed1 = yuv2rgba64le_1_c;

                 *yuv2packed2 = yuv2rgba64le_2_c;

                 *yuv2packedX = yuv2rgba64le_X_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packed1 = yuv2rgbx64le_1_c;

                 *yuv2packed2 = yuv2rgbx64le_2_c;

                 *yuv2packedX = yuv2rgbx64le_X_c;

             }

             break;

         case AV_PIX_FMT_RGBA64BE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packed1 = yuv2rgba64be_1_c;

                 *yuv2packed2 = yuv2rgba64be_2_c;

                 *yuv2packedX = yuv2rgba64be_X_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packed1 = yuv2rgbx64be_1_c;

                 *yuv2packed2 = yuv2rgbx64be_2_c;

                 *yuv2packedX = yuv2rgbx64be_X_c;

             }

             break;

         case AV_PIX_FMT_BGRA64LE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packed1 = yuv2bgra64le_1_c;

                 *yuv2packed2 = yuv2bgra64le_2_c;

                 *yuv2packedX = yuv2bgra64le_X_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packed1 = yuv2bgrx64le_1_c;

                 *yuv2packed2 = yuv2bgrx64le_2_c;

                 *yuv2packedX = yuv2bgrx64le_X_c;

             }

             break;

         case AV_PIX_FMT_BGRA64BE:

 #if CONFIG_SWSCALE_ALPHA

             if (c->needAlpha) {

                 *yuv2packed1 = yuv2bgra64be_1_c;

                 *yuv2packed2 = yuv2bgra64be_2_c;

                 *yuv2packedX = yuv2bgra64be_X_c;

             } else

 #endif /* CONFIG_SWSCALE_ALPHA */

             {

                 *yuv2packed1 = yuv2bgrx64be_1_c;

                 *yuv2packed2 = yuv2bgrx64be_2_c;

                 *yuv2packedX = yuv2bgrx64be_X_c;

             }

             break;

         case AV_PIX_FMT_RGB48LE:

             *yuv2packed1 = yuv2rgb48le_1_c;

             *yuv2packed2 = yuv2rgb48le_2_c;

             *yuv2packedX = yuv2rgb48le_X_c;

             break;

         case AV_PIX_FMT_RGB48BE:

             *yuv2packed1 = yuv2rgb48be_1_c;

             *yuv2packed2 = yuv2rgb48be_2_c;

             *yuv2packedX = yuv2rgb48be_X_c;

             break;

         case AV_PIX_FMT_BGR48LE:

             *yuv2packed1 = yuv2bgr48le_1_c;

             *yuv2packed2 = yuv2bgr48le_2_c;

             *yuv2packedX = yuv2bgr48le_X_c;

             break;

         case AV_PIX_FMT_BGR48BE:

             *yuv2packed1 = yuv2bgr48be_1_c;

             *yuv2packed2 = yuv2bgr48be_2_c;

             *yuv2packedX = yuv2bgr48be_X_c;

             break;

         case AV_PIX_FMT_RGB32:

         case AV_PIX_FMT_BGR32:

 #if CONFIG_SMALL

             *yuv2packed1 = yuv2rgb32_1_c;

             *yuv2packed2 = yuv2rgb32_2_c;

             *yuv2packedX = yuv2rgb32_X_c;

 #else

 #if CONFIG_SWSCALE_ALPHA

                 if (c->needAlpha) {

                     *yuv2packed1 = yuv2rgba32_1_c;

                     *yuv2packed2 = yuv2rgba32_2_c;

                     *yuv2packedX = yuv2rgba32_X_c;

                 } else

 #endif /* CONFIG_SWSCALE_ALPHA */

                 {

                     *yuv2packed1 = yuv2rgbx32_1_c;

                     *yuv2packed2 = yuv2rgbx32_2_c;

                     *yuv2packedX = yuv2rgbx32_X_c;

                 }

 #endif /* !CONFIG_SMALL */

             break;

         case AV_PIX_FMT_RGB32_1:

         case AV_PIX_FMT_BGR32_1:

 #if CONFIG_SMALL

                 *yuv2packed1 = yuv2rgb32_1_1_c;

                 *yuv2packed2 = yuv2rgb32_1_2_c;

                 *yuv2packedX = yuv2rgb32_1_X_c;

 #else

 #if CONFIG_SWSCALE_ALPHA

                 if (c->needAlpha) {

                     *yuv2packed1 = yuv2rgba32_1_1_c;

                     *yuv2packed2 = yuv2rgba32_1_2_c;

                     *yuv2packedX = yuv2rgba32_1_X_c;

                 } else

 #endif /* CONFIG_SWSCALE_ALPHA */

                 {

                     *yuv2packed1 = yuv2rgbx32_1_1_c;

                     *yuv2packed2 = yuv2rgbx32_1_2_c;

                     *yuv2packedX = yuv2rgbx32_1_X_c;

                 }

 #endif /* !CONFIG_SMALL */

                 break;

         case AV_PIX_FMT_RGB24:

             *yuv2packed1 = yuv2rgb24_1_c;

             *yuv2packed2 = yuv2rgb24_2_c;

             *yuv2packedX = yuv2rgb24_X_c;

             break;

         case AV_PIX_FMT_BGR24:

             *yuv2packed1 = yuv2bgr24_1_c;

             *yuv2packed2 = yuv2bgr24_2_c;

             *yuv2packedX = yuv2bgr24_X_c;

             break;

         case AV_PIX_FMT_RGB565LE:

         case AV_PIX_FMT_RGB565BE:

         case AV_PIX_FMT_BGR565LE:

         case AV_PIX_FMT_BGR565BE:

             *yuv2packed1 = yuv2rgb16_1_c;

             *yuv2packed2 = yuv2rgb16_2_c;

             *yuv2packedX = yuv2rgb16_X_c;

             break;

         case AV_PIX_FMT_RGB555LE:

         case AV_PIX_FMT_RGB555BE:

         case AV_PIX_FMT_BGR555LE:

         case AV_PIX_FMT_BGR555BE:

             *yuv2packed1 = yuv2rgb15_1_c;

             *yuv2packed2 = yuv2rgb15_2_c;

             *yuv2packedX = yuv2rgb15_X_c;

             break;

         case AV_PIX_FMT_RGB444LE:

         case AV_PIX_FMT_RGB444BE:

         case AV_PIX_FMT_BGR444LE:

         case AV_PIX_FMT_BGR444BE:

             *yuv2packed1 = yuv2rgb12_1_c;

             *yuv2packed2 = yuv2rgb12_2_c;

             *yuv2packedX = yuv2rgb12_X_c;

             break;

         case AV_PIX_FMT_RGB8:

         case AV_PIX_FMT_BGR8:

             *yuv2packed1 = yuv2rgb8_1_c;

             *yuv2packed2 = yuv2rgb8_2_c;

             *yuv2packedX = yuv2rgb8_X_c;

             break;

         case AV_PIX_FMT_RGB4:

         case AV_PIX_FMT_BGR4:

             *yuv2packed1 = yuv2rgb4_1_c;

             *yuv2packed2 = yuv2rgb4_2_c;

             *yuv2packedX = yuv2rgb4_X_c;

             break;

         case AV_PIX_FMT_RGB4_BYTE:

         case AV_PIX_FMT_BGR4_BYTE:

             *yuv2packed1 = yuv2rgb4b_1_c;

             *yuv2packed2 = yuv2rgb4b_2_c;

             *yuv2packedX = yuv2rgb4b_X_c;

             break;

         }

     }

     switch (dstFormat) {

     case AV_PIX_FMT_MONOWHITE:

         *yuv2packed1 = yuv2monowhite_1_c;

         *yuv2packed2 = yuv2monowhite_2_c;

         *yuv2packedX = yuv2monowhite_X_c;

         break;

     case AV_PIX_FMT_MONOBLACK:

         *yuv2packed1 = yuv2monoblack_1_c;

         *yuv2packed2 = yuv2monoblack_2_c;

         *yuv2packedX = yuv2monoblack_X_c;

         break;

     case AV_PIX_FMT_YUYV422:

         *yuv2packed1 = yuv2yuyv422_1_c;

         *yuv2packed2 = yuv2yuyv422_2_c;

         *yuv2packedX = yuv2yuyv422_X_c;

         break;

     case AV_PIX_FMT_YVYU422:

         *yuv2packed1 = yuv2yvyu422_1_c;

         *yuv2packed2 = yuv2yvyu422_2_c;

         *yuv2packedX = yuv2yvyu422_X_c;

         break;

     case AV_PIX_FMT_UYVY422:

         *yuv2packed1 = yuv2uyvy422_1_c;

         *yuv2packed2 = yuv2uyvy422_2_c;

         *yuv2packedX = yuv2uyvy422_X_c;

         break;

     case AV_PIX_FMT_YA8:

         *yuv2packed1 = yuv2ya8_1_c;

         *yuv2packed2 = yuv2ya8_2_c;

         *yuv2packedX = yuv2ya8_X_c;

         break;

     case AV_PIX_FMT_AYUV64LE:

         *yuv2packedX = yuv2ayuv64le_X_c;

         break;

     }

 }

AV_PIX_FMT_UYVY422
packed YUV 4:2:2, 16bpp, Cb Y0 Cr Y1
Definition: pixfmt.h:77

math.h

AV_PIX_FMT_GBRAP10LE
planar GBR 4:4:4:4 40bpp, little-endian
Definition: pixfmt.h:287

NULL
#define NULL
Definition: coverity.c:32

val
const char const char void * val
Definition: avisynth_c.h:771

yuv2rgb_1_c_template
static av_always_inline void yuv2rgb_1_c_template(SwsContext *c, const int16_t *buf0, const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf0, uint8_t *dest, int dstW, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha)
Definition: output.c:1545

yuv2ayuv64le_X_c
static void yuv2ayuv64le_X_c(SwsContext *c, const int16_t *lumFilter, const int16_t **_lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **_chrUSrc, const int16_t **_chrVSrc, int chrFilterSize, const int16_t **_alpSrc, uint8_t *dest, int dstW, int y)
Definition: output.c:2221

rgb2rgb.h

SwsContext::yuv2rgb_u2g_coeff
int yuv2rgb_u2g_coeff
Definition: swscale_internal.h:435

ff_sws_init_output_funcs
av_cold void ff_sws_init_output_funcs(SwsContext *c, yuv2planar1_fn *yuv2plane1, yuv2planarX_fn *yuv2planeX, yuv2interleavedX_fn *yuv2nv12cX, yuv2packed1_fn *yuv2packed1, yuv2packed2_fn *yuv2packed2, yuv2packedX_fn *yuv2packedX, yuv2anyX_fn *yuv2anyX)
Definition: output.c:2269

yuv2gbrp16_full_X_c
static void yuv2gbrp16_full_X_c(SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrcx, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrcx, const int16_t **chrVSrcx, int chrFilterSize, const int16_t **alpSrcx, uint8_t **dest, int dstW, int y)
Definition: output.c:2053

shift
static int shift(int a, int b)
Definition: sonic.c:82

av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2363

YUVRGB_TABLE_HEADROOM
#define YUVRGB_TABLE_HEADROOM
Definition: swscale_internal.h:38

X_DITHER
#define X_DITHER(u, v)

yuv2p010lX_BE_c
static void yuv2p010lX_BE_c(const int16_t *filter, int filterSize, const int16_t **src, uint8_t *dest, int dstW, const uint8_t *dither, int offset)
Definition: output.c:424

AV_PIX_FMT_YA8
8 bits gray, 8 bits alpha
Definition: pixfmt.h:139

AV_PIX_FMT_BGRA64LE
packed RGBA 16:16:16:16, 64bpp, 16B, 16G, 16R, 16A, the 2-byte value for each R/G/B/A component is st...
Definition: pixfmt.h:204

A1
#define A1
Definition: binkdsp.c:31

AV_PIX_FMT_RGB24
packed RGB 8:8:8, 24bpp, RGBRGB...
Definition: pixfmt.h:64

AV_PIX_FMT_BGR4
packed RGB 1:2:1 bitstream, 4bpp, (msb)1B 2G 1R(lsb), a byte contains two pixels, the first pixel in ...
Definition: pixfmt.h:80

g
const char * g
Definition: vf_curves.c:112

desc
const char * desc
Definition: nvenc.c:65

accumulate_bit
#define accumulate_bit(acc, val)
Definition: output.c:434

acc
int acc
Definition: yuv2rgb.c:554

yuv2rgb
static void yuv2rgb(uint8_t *out, int ridx, int Y, int U, int V)
Definition: g2meet.c:277

ff_dither_2x2_8
const uint8_t ff_dither_2x2_8[][8]
Definition: output.c:45

yuv2rgb_full_1_c_template
static av_always_inline void yuv2rgb_full_1_c_template(SwsContext *c, const int16_t *buf0, const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf0, uint8_t *dest, int dstW, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha)
Definition: output.c:1890

AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:164

AV_PIX_FMT_RGB555LE
packed RGB 5:5:5, 16bpp, (msb)1X 5R 5G 5B(lsb), little-endian, X=unused/undefined ...
Definition: pixfmt.h:104

AV_PIX_FMT_BGRA64BE
packed RGBA 16:16:16:16, 64bpp, 16B, 16G, 16R, 16A, the 2-byte value for each R/G/B/A component is st...
Definition: pixfmt.h:203

b
const char * b
Definition: vf_curves.c:113

yuv2p010l1_LE_c
static void yuv2p010l1_LE_c(const int16_t *src, uint8_t *dest, int dstW, const uint8_t *dither, int offset)
Definition: output.c:403

SwsContext::table_bU
uint8_t * table_bU[256+2 *YUVRGB_TABLE_HEADROOM]
Definition: swscale_internal.h:402

av_bswap16
#define av_bswap16
Definition: bswap.h:31

is16BPS
static av_always_inline int is16BPS(enum AVPixelFormat pix_fmt)
Definition: swscale_internal.h:644

avutil.h
Convenience header that includes libavutil's core.

AV_PIX_FMT_BGR565LE
packed BGR 5:6:5, 16bpp, (msb) 5B 6G 5R(lsb), little-endian
Definition: pixfmt.h:107

AV_PIX_FMT_GBRP12LE
planar GBR 4:4:4 36bpp, little-endian
Definition: pixfmt.h:251

AV_PIX_FMT_RGB444BE
packed RGB 4:4:4, 16bpp, (msb)4X 4R 4G 4B(lsb), big-endian, X=unused/undefined
Definition: pixfmt.h:136

AV_PIX_FMT_RGB444
#define AV_PIX_FMT_RGB444
Definition: pixfmt.h:357

src
#define src
Definition: vp8dsp.c:254

AV_PIX_FMT_GBRP12BE
planar GBR 4:4:4 36bpp, big-endian
Definition: pixfmt.h:250

ff_dither_8x8_220
const uint8_t ff_dither_8x8_220[][8]
Definition: output.c:84

yuv2plane1_16_c_template
static av_always_inline void yuv2plane1_16_c_template(const int32_t *src, uint16_t *dest, int dstW, int big_endian, int output_bits)
Definition: output.c:144

r_b
#define r_b

yuv2planeX_16_c_template
static av_always_inline void yuv2planeX_16_c_template(const int16_t *filter, int filterSize, const int32_t **src, uint16_t *dest, int dstW, int big_endian, int output_bits)
Definition: output.c:158

AV_PIX_FMT_RGB4
packed RGB 1:2:1 bitstream, 4bpp, (msb)1R 2G 1B(lsb), a byte contains two pixels, the first pixel in ...
Definition: pixfmt.h:83

output_pixels
#define output_pixels(pos, Y1, U, Y2, V)
Definition: output.c:644

attributes.h
Macro definitions for various function/variable attributes.

b_r
#define b_r

AV_PIX_FMT_RGB565LE
packed RGB 5:6:5, 16bpp, (msb) 5R 6G 5B(lsb), little-endian
Definition: pixfmt.h:102

AV_PIX_FMT_BGR4_BYTE
packed RGB 1:2:1, 8bpp, (msb)1B 2G 1R(lsb)
Definition: pixfmt.h:81

mathematics.h

ff_dither_8x8_32
const uint8_t ff_dither_8x8_32[][8]
Definition: output.c:59

AV_PIX_FMT_GBRAP16BE
planar GBRA 4:4:4:4 64bpp, big-endian
Definition: pixfmt.h:212

av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:37

ff_dither_2x2_4
const uint8_t ff_dither_2x2_4[][8]
Definition: output.c:39

filter
static void filter(int16_t *output, ptrdiff_t out_stride, int16_t *low, ptrdiff_t low_stride, int16_t *high, ptrdiff_t high_stride, int len, int clip)
Definition: cfhd.c:114

yuv2interleavedX_fn
void(* yuv2interleavedX_fn)(struct SwsContext *c, const int16_t *chrFilter, int chrFilterSize, const int16_t **chrUSrc, const int16_t **chrVSrc, uint8_t *dest, int dstW)
Write one line of horizontally scaled chroma to interleaved output with multi-point vertical scaling ...
Definition: swscale_internal.h:133

AVPixFmtDescriptor::comp
AVComponentDescriptor comp[4]
Parameters that describe how pixels are packed.
Definition: pixdesc.h:117

config.h

uint8_t
uint8_t
Definition: audio_convert.c:194

av_cold
#define av_cold
Definition: attributes.h:82

AV_PIX_FMT_FLAG_ALPHA
#define AV_PIX_FMT_FLAG_ALPHA
The pixel format has an alpha channel.
Definition: pixdesc.h:181

av_assert2
#define av_assert2(cond)
assert() equivalent that lies in speed-critical code.
Definition: avassert.h:64

ff_dither_4x4_16
const uint8_t ff_dither_4x4_16[][8]
Definition: output.c:51

SwsContext::yuv2rgb_y_coeff
int yuv2rgb_y_coeff
Definition: swscale_internal.h:432

AV_PIX_FMT_RGB48LE
packed RGB 16:16:16, 48bpp, 16R, 16G, 16B, the 2-byte value for each R/G/B component is stored as lit...
Definition: pixfmt.h:99

Y
#define Y
Definition: vf_boxblur.c:76

yuv2anyX_fn
void(* yuv2anyX_fn)(struct SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t **dest, int dstW, int y)
Write one line of horizontally scaled Y/U/V/A to YUV/RGB output by doing multi-point vertical scaling...
Definition: swscale_internal.h:268

AV_PIX_FMT_RGBA64BE
packed RGBA 16:16:16:16, 64bpp, 16R, 16G, 16B, 16A, the 2-byte value for each R/G/B/A component is st...
Definition: pixfmt.h:201

yuv2ya8_2_c
static void yuv2ya8_2_c(SwsContext *c, const int16_t *buf[2], const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf[2], uint8_t *dest, int dstW, int yalpha, int uvalpha, int y)
Definition: output.c:2154

AV_PIX_FMT_RGB444LE
packed RGB 4:4:4, 16bpp, (msb)4X 4R 4G 4B(lsb), little-endian, X=unused/undefined ...
Definition: pixfmt.h:135

SWS_FULL_CHR_H_INT
#define SWS_FULL_CHR_H_INT
Definition: swscale.h:79

u
#define u(width, name, range_min, range_max)
Definition: cbs_h2645.c:344

AV_PIX_FMT_RGB565BE
packed RGB 5:6:5, 16bpp, (msb) 5R 6G 5B(lsb), big-endian
Definition: pixfmt.h:101

AV_PIX_FMT_ABGR
packed ABGR 8:8:8:8, 32bpp, ABGRABGR...
Definition: pixfmt.h:90

yuv2gbrp_full_X_c
static void yuv2gbrp_full_X_c(SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t **dest, int dstW, int y)
Definition: output.c:1971

yuv2422_2_c_template
static av_always_inline void yuv2422_2_c_template(SwsContext *c, const int16_t *buf[2], const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf[2], uint8_t *dest, int dstW, int yalpha, int uvalpha, int y, enum AVPixelFormat target)
Definition: output.c:702

DECLARE_ALIGNED
#define DECLARE_ALIGNED(n, t, v)
Declare a variable that is aligned in memory.
Definition: mem.h:112

AV_PIX_FMT_GBRP16BE
planar GBR 4:4:4 48bpp, big-endian
Definition: pixfmt.h:170

yuv2rgb_full_2_c_template
static av_always_inline void yuv2rgb_full_2_c_template(SwsContext *c, const int16_t *buf[2], const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf[2], uint8_t *dest, int dstW, int yalpha, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha)
Definition: output.c:1845

swscale.h
external API header

yuv2rgb_full_X_c_template
static av_always_inline void yuv2rgb_full_X_c_template(SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t *dest, int dstW, int y, enum AVPixelFormat target, int hasAlpha)
Definition: output.c:1795

SwsContext::dstFormat
enum AVPixelFormat dstFormat
Destination pixel format.
Definition: swscale_internal.h:300

SwsContext::table_gU
uint8_t * table_gU[256+2 *YUVRGB_TABLE_HEADROOM]
Definition: swscale_internal.h:401

yuv2p010cX_c
static void yuv2p010cX_c(SwsContext *c, const int16_t *chrFilter, int chrFilterSize, const int16_t **chrUSrc, const int16_t **chrVSrc, uint8_t *dest8, int chrDstW)
Definition: output.c:380

yuv2p010l1_c
static void yuv2p010l1_c(const int16_t *src, uint16_t *dest, int dstW, int big_endian)
Definition: output.c:350

A
#define A(x)
Definition: vp56_arith.h:28

SwsContext::yuv2rgb_u2b_coeff
int yuv2rgb_u2b_coeff
Definition: swscale_internal.h:436

SwsContext::dither_error
int * dither_error[4]
Definition: swscale_internal.h:415

yuv2packed1_fn
void(* yuv2packed1_fn)(struct SwsContext *c, const int16_t *lumSrc, const int16_t *chrUSrc[2], const int16_t *chrVSrc[2], const int16_t *alpSrc, uint8_t *dest, int dstW, int uvalpha, int y)
Write one line of horizontally scaled Y/U/V/A to packed-pixel YUV/RGB output without any additional v...
Definition: swscale_internal.h:169

U
#define U(x)
Definition: vp56_arith.h:37

AV_PIX_FMT_GBRP9BE
planar GBR 4:4:4 27bpp, big-endian
Definition: pixfmt.h:166

A2
#define A2
Definition: binkdsp.c:32

B_R
#define B_R
Definition: output.c:796

SWS_DITHER_X_DITHER
Definition: swscale_internal.h:71

AV_PIX_FMT_BGR32_1
#define AV_PIX_FMT_BGR32_1
Definition: pixfmt.h:345

yuv2rgba64_full_1_c_template
static av_always_inline void yuv2rgba64_full_1_c_template(SwsContext *c, const int32_t *buf0, const int32_t *ubuf[2], const int32_t *vbuf[2], const int32_t *abuf0, uint16_t *dest, int dstW, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
Definition: output.c:1171

R
#define R
Definition: huffyuvdsp.h:34

SWS_DITHER_AUTO
Definition: swscale_internal.h:67

AV_PIX_FMT_P016BE
like NV12, with 16bpp per component, big-endian
Definition: pixfmt.h:297

yuv2p010l1_BE_c
static void yuv2p010l1_BE_c(const int16_t *src, uint8_t *dest, int dstW, const uint8_t *dither, int offset)
Definition: output.c:410

d64
const uint8_t * d64
Definition: yuv2rgb.c:502

B
#define B
Definition: huffyuvdsp.h:32

AV_PIX_FMT_BGRA
packed BGRA 8:8:8:8, 32bpp, BGRABGRA...
Definition: pixfmt.h:91

r
const char * r
Definition: vf_curves.c:111

dither
static const uint8_t dither[8][8]
Definition: vf_fspp.c:57

yuv2rgba64_X_c_template
static av_always_inline void yuv2rgba64_X_c_template(SwsContext *c, const int16_t *lumFilter, const int32_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int32_t **chrUSrc, const int32_t **chrVSrc, int chrFilterSize, const int32_t **alpSrc, uint16_t *dest, int dstW, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
Definition: output.c:805

yuv2p010lX_LE_c
static void yuv2p010lX_LE_c(const int16_t *filter, int filterSize, const int16_t **src, uint8_t *dest, int dstW, const uint8_t *dither, int offset)
Definition: output.c:417

AV_PIX_FMT_NV12
planar YUV 4:2:0, 12bpp, 1 plane for Y and 1 plane for the UV components, which are interleaved (firs...
Definition: pixfmt.h:85

avassert.h
simple assert() macros that are a bit more flexible than ISO C assert().

AV_PIX_FMT_P016LE
like NV12, with 16bpp per component, little-endian
Definition: pixfmt.h:296

AV_PIX_FMT_P010BE
like NV12, with 10bpp per component, data in the high bits, zeros in the low bits, big-endian
Definition: pixfmt.h:281

yuv2planeX_10_c_template
static av_always_inline void yuv2planeX_10_c_template(const int16_t *filter, int filterSize, const int16_t **src, uint16_t *dest, int dstW, int big_endian, int output_bits)
Definition: output.c:234

offset
static const uint8_t offset[127][2]
Definition: vf_spp.c:92

yuv2NBPS
#define yuv2NBPS(bits, BE_LE, is_be, template_size, typeX_t)
Definition: output.c:254

AV_PIX_FMT_ARGB
packed ARGB 8:8:8:8, 32bpp, ARGBARGB...
Definition: pixfmt.h:88

AV_PIX_FMT_BGR48LE
packed RGB 16:16:16, 48bpp, 16B, 16G, 16R, the 2-byte value for each R/G/B component is stored as lit...
Definition: pixfmt.h:145

AV_PIX_FMT_RGBA
packed RGBA 8:8:8:8, 32bpp, RGBARGBA...
Definition: pixfmt.h:89

SwsContext::yuv2rgb_v2r_coeff
int yuv2rgb_v2r_coeff
Definition: swscale_internal.h:433

yuv2mono_2_c_template
static av_always_inline void yuv2mono_2_c_template(SwsContext *c, const int16_t *buf[2], const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf[2], uint8_t *dest, int dstW, int yalpha, int uvalpha, int y, enum AVPixelFormat target)
Definition: output.c:498

yuv2422_1_c_template
static av_always_inline void yuv2422_1_c_template(SwsContext *c, const int16_t *buf0, const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf0, uint8_t *dest, int dstW, int uvalpha, int y, enum AVPixelFormat target)
Definition: output.c:735

AVPixFmtDescriptor::flags
uint64_t flags
Combination of AV_PIX_FMT_FLAG_...
Definition: pixdesc.h:106

AV_PIX_FMT_NV21
like NV12, but U and V bytes are swapped
Definition: pixfmt.h:86

AV_PIX_FMT_GBRAP12BE
planar GBR 4:4:4:4 48bpp, big-endian
Definition: pixfmt.h:283

yuv2planar1_fn
void(* yuv2planar1_fn)(const int16_t *src, uint8_t *dest, int dstW, const uint8_t *dither, int offset)
Write one line of horizontally scaled data to planar output without any additional vertical scaling (...
Definition: swscale_internal.h:98

AV_PIX_FMT_GBRAP10BE
planar GBR 4:4:4:4 40bpp, big-endian
Definition: pixfmt.h:286

pixdesc.h

yuv2ya8_X_c
static void yuv2ya8_X_c(SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t *dest, int dstW, int y)
Definition: output.c:2185

SwsContext::yuv2rgb_y_offset
int yuv2rgb_y_offset
Definition: swscale_internal.h:431

AV_PIX_FMT_RGB4_BYTE
packed RGB 1:2:1, 8bpp, (msb)1R 2G 1B(lsb)
Definition: pixfmt.h:84

yuv2mono_1_c_template
static av_always_inline void yuv2mono_1_c_template(SwsContext *c, const int16_t *buf0, const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf0, uint8_t *dest, int dstW, int uvalpha, int y, enum AVPixelFormat target)
Definition: output.c:559

intreadwrite.h

yuv2plane1_8_c
static void yuv2plane1_8_c(const int16_t *src, uint8_t *dest, int dstW, const uint8_t *dither, int offset)
Definition: output.c:296

int32_t
int32_t
Definition: audio_convert.c:194

AV_PIX_FMT_YVYU422
packed YUV 4:2:2, 16bpp, Y0 Cr Y1 Cb
Definition: pixfmt.h:206

SwsContext::table_gV
int table_gV[256+2 *YUVRGB_TABLE_HEADROOM]
Definition: swscale_internal.h:399

AV_PIX_FMT_BGR24
packed RGB 8:8:8, 24bpp, BGRBGR...
Definition: pixfmt.h:65

SwsContext::table_rV
uint8_t * table_rV[256+2 *YUVRGB_TABLE_HEADROOM]
Definition: swscale_internal.h:400

AV_PIX_FMT_P010LE
like NV12, with 10bpp per component, data in the high bits, zeros in the low bits, little-endian
Definition: pixfmt.h:280

swscale_internal.h

AV_PIX_FMT_BGR48BE
packed RGB 16:16:16, 48bpp, 16B, 16G, 16R, the 2-byte value for each R/G/B component is stored as big...
Definition: pixfmt.h:144

AV_PIX_FMT_BGR565BE
packed BGR 5:6:5, 16bpp, (msb) 5B 6G 5R(lsb), big-endian
Definition: pixfmt.h:106

AV_PIX_FMT_GBRAP12LE
planar GBR 4:4:4:4 48bpp, little-endian
Definition: pixfmt.h:284

AV_PIX_FMT_BGR555
#define AV_PIX_FMT_BGR555
Definition: pixfmt.h:361

AV_PIX_FMT_BGR32
#define AV_PIX_FMT_BGR32
Definition: pixfmt.h:344

isBE
static av_always_inline int isBE(enum AVPixelFormat pix_fmt)
Definition: swscale_internal.h:658

YUV2PACKED16WRAPPER
#define YUV2PACKED16WRAPPER(name, base, ext, fmt, hasAlpha, eightbytes)
Definition: output.c:1251

AV_PIX_FMT_BGR8
packed RGB 3:3:2, 8bpp, (msb)2B 3G 3R(lsb)
Definition: pixfmt.h:79

cpu.h

yuv2mono_X_c_template
static av_always_inline void yuv2mono_X_c_template(SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t *dest, int dstW, int y, enum AVPixelFormat target)
Definition: output.c:445

AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:81

yuv2ya8_1_c
static void yuv2ya8_1_c(SwsContext *c, const int16_t *buf0, const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf0, uint8_t *dest, int dstW, int uvalpha, int y)
Definition: output.c:2128

AV_PIX_FMT_GBRP10BE
planar GBR 4:4:4 30bpp, big-endian
Definition: pixfmt.h:168

AV_PIX_FMT_RGB32
#define AV_PIX_FMT_RGB32
Definition: pixfmt.h:342

yuv2rgb_2_c_template
static av_always_inline void yuv2rgb_2_c_template(SwsContext *c, const int16_t *buf[2], const int16_t *ubuf[2], const int16_t *vbuf[2], const int16_t *abuf[2], uint8_t *dest, int dstW, int yalpha, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha)
Definition: output.c:1505

AV_PIX_FMT_YUYV422
packed YUV 4:2:2, 16bpp, Y0 Cb Y1 Cr
Definition: pixfmt.h:63

AV_PIX_FMT_GBRP14LE
planar GBR 4:4:4 42bpp, little-endian
Definition: pixfmt.h:253

SwsContext::needAlpha
int needAlpha
Definition: swscale_internal.h:356

ff_dither_8x8_73
const uint8_t ff_dither_8x8_73[][8]
Definition: output.c:71

buf
void * buf
Definition: avisynth_c.h:690

yuv2422_X_c_template
static av_always_inline void yuv2422_X_c_template(SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t *dest, int dstW, int y, enum AVPixelFormat target)
Definition: output.c:663

bswap.h
byte swapping routines

d32
const uint8_t * d32
Definition: yuv2rgb.c:501

AV_PIX_FMT_GBRP14BE
planar GBR 4:4:4 42bpp, big-endian
Definition: pixfmt.h:252

yuv2rgb_write
static av_always_inline void yuv2rgb_write(uint8_t *_dest, int i, int Y1, int Y2, unsigned A1, unsigned A2, const void *_r, const void *_g, const void *_b, int y, enum AVPixelFormat target, int hasAlpha)
Definition: output.c:1332

AV_PIX_FMT_BGR555LE
packed BGR 5:5:5, 16bpp, (msb)1X 5B 5G 5R(lsb), little-endian, X=unused/undefined ...
Definition: pixfmt.h:109

SH
#define SH(val, pdst)
Definition: generic_macros_msa.h:151

yuv2rgba64_full_X_c_template
static av_always_inline void yuv2rgba64_full_X_c_template(SwsContext *c, const int16_t *lumFilter, const int32_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int32_t **chrUSrc, const int32_t **chrVSrc, int chrFilterSize, const int32_t **alpSrc, uint16_t *dest, int dstW, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
Definition: output.c:1055

yuv2p010lX_c
static void yuv2p010lX_c(const int16_t *filter, int filterSize, const int16_t **src, uint16_t *dest, int dstW, int big_endian)
Definition: output.c:363

YUV2RGBWRAPPER
#define YUV2RGBWRAPPER(name, base, ext, fmt, hasAlpha)
Definition: output.c:1624

AV_PIX_FMT_BGR565
#define AV_PIX_FMT_BGR565
Definition: pixfmt.h:360

SwsContext::chrDither8
const uint8_t * chrDither8
Definition: swscale_internal.h:493

AV_PIX_FMT_RGB555BE
packed RGB 5:5:5, 16bpp, (msb)1X 5R 5G 5B(lsb), big-endian, X=unused/undefined
Definition: pixfmt.h:103

AV_PIX_FMT_BGR444BE
packed BGR 4:4:4, 16bpp, (msb)4X 4B 4G 4R(lsb), big-endian, X=unused/undefined
Definition: pixfmt.h:138

SwsContext::dither
SwsDither dither
Definition: swscale_internal.h:623

A_DITHER
#define A_DITHER(u, v)

AV_PIX_FMT_MONOBLACK
Y, 1bpp, 0 is black, 1 is white, in each byte pixels are ordered from the msb to the lsb...
Definition: pixfmt.h:72

yuv2planarX_fn
void(* yuv2planarX_fn)(const int16_t *filter, int filterSize, const int16_t **src, uint8_t *dest, int dstW, const uint8_t *dither, int offset)
Write one line of horizontally scaled data to planar output with multi-point vertical scaling between...
Definition: swscale_internal.h:114

if
if(ret< 0)
Definition: vf_mcdeint.c:279

yuv2packed2_fn
void(* yuv2packed2_fn)(struct SwsContext *c, const int16_t *lumSrc[2], const int16_t *chrUSrc[2], const int16_t *chrVSrc[2], const int16_t *alpSrc[2], uint8_t *dest, int dstW, int yalpha, int uvalpha, int y)
Write one line of horizontally scaled Y/U/V/A to packed-pixel YUV/RGB output by doing bilinear scalin...
Definition: swscale_internal.h:202

AV_PIX_FMT_MONOWHITE
Y, 1bpp, 0 is white, 1 is black, in each byte pixels are ordered from the msb to the lsb...
Definition: pixfmt.h:71

G
#define G
Definition: huffyuvdsp.h:33

AV_PIX_FMT_GBRAP
planar GBRA 4:4:4:4 32bpp
Definition: pixfmt.h:211

yuv2rgb_X_c_template
static av_always_inline void yuv2rgb_X_c_template(SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t *dest, int dstW, int y, enum AVPixelFormat target, int hasAlpha)
Definition: output.c:1451

AV_PIX_FMT_GBRP9LE
planar GBR 4:4:4 27bpp, little-endian
Definition: pixfmt.h:167

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

yuv2packedX_fn
void(* yuv2packedX_fn)(struct SwsContext *c, const int16_t *lumFilter, const int16_t **lumSrc, int lumFilterSize, const int16_t *chrFilter, const int16_t **chrUSrc, const int16_t **chrVSrc, int chrFilterSize, const int16_t **alpSrc, uint8_t *dest, int dstW, int y)
Write one line of horizontally scaled Y/U/V/A to packed-pixel YUV/RGB output by doing multi-point vertical scaling between input pixels.
Definition: swscale_internal.h:234

AV_PIX_FMT_RGB48BE
packed RGB 16:16:16, 48bpp, 16R, 16G, 16B, the 2-byte value for each R/G/B component is stored as big-endian
Definition: pixfmt.h:98

AV_PIX_FMT_BGR444
#define AV_PIX_FMT_BGR444
Definition: pixfmt.h:362

AV_WL16
#define AV_WL16(p, v)
Definition: intreadwrite.h:412

output_pixel
#define output_pixel(pos, val, bias, signedness)
Definition: output.c:797

d128
const uint8_t * d128
Definition: yuv2rgb.c:553

AV_PIX_FMT_RGB8
packed RGB 3:3:2, 8bpp, (msb)2R 3G 3B(lsb)
Definition: pixfmt.h:82

AV_PIX_FMT_RGB555
#define AV_PIX_FMT_RGB555
Definition: pixfmt.h:356

yuv2rgb_write_full
static av_always_inline void yuv2rgb_write_full(SwsContext *c, uint8_t *dest, int i, int Y, int A, int U, int V, int y, enum AVPixelFormat target, int hasAlpha, int err[4])
Definition: output.c:1655

yuv2rgba64_full_2_c_template
static av_always_inline void yuv2rgba64_full_2_c_template(SwsContext *c, const int32_t *buf[2], const int32_t *ubuf[2], const int32_t *vbuf[2], const int32_t *abuf[2], uint16_t *dest, int dstW, int yalpha, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
Definition: output.c:1119

SWS_DITHER_ED
Definition: swscale_internal.h:69

yuv2rgba64_1_c_template
static av_always_inline void yuv2rgba64_1_c_template(SwsContext *c, const int32_t *buf0, const int32_t *ubuf[2], const int32_t *vbuf[2], const int32_t *abuf0, uint16_t *dest, int dstW, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
Definition: output.c:952

AV_PIX_FMT_RGB32_1
#define AV_PIX_FMT_RGB32_1
Definition: pixfmt.h:343

yuv2plane1_10_c_template
static av_always_inline void yuv2plane1_10_c_template(const int16_t *src, uint16_t *dest, int dstW, int big_endian, int output_bits)
Definition: output.c:221

yuv2nv12cX_c
static void yuv2nv12cX_c(SwsContext *c, const int16_t *chrFilter, int chrFilterSize, const int16_t **chrUSrc, const int16_t **chrVSrc, uint8_t *dest, int chrDstW)
Definition: output.c:306

yuv2rgba64_2_c_template
static av_always_inline void yuv2rgba64_2_c_template(SwsContext *c, const int32_t *buf[2], const int32_t *ubuf[2], const int32_t *vbuf[2], const int32_t *abuf[2], uint16_t *dest, int dstW, int yalpha, int uvalpha, int y, enum AVPixelFormat target, int hasAlpha, int eightbytes)
Definition: output.c:887

AV_PIX_FMT_RGB565
#define AV_PIX_FMT_RGB565
Definition: pixfmt.h:355

AV_PIX_FMT_BGR555BE
packed BGR 5:5:5, 16bpp, (msb)1X 5B 5G 5R(lsb), big-endian, X=unused/undefined
Definition: pixfmt.h:108

SwsContext::yuv2rgb_v2g_coeff
int yuv2rgb_v2g_coeff
Definition: swscale_internal.h:434

R_B
#define R_B
Definition: output.c:795

av_always_inline
#define av_always_inline
Definition: attributes.h:39

AV_PIX_FMT_GBRP16LE
planar GBR 4:4:4 48bpp, little-endian
Definition: pixfmt.h:171

AV_PIX_FMT_BGR444LE
packed BGR 4:4:4, 16bpp, (msb)4X 4B 4G 4R(lsb), little-endian, X=unused/undefined
Definition: pixfmt.h:137

yuv2p016cX_c
static void yuv2p016cX_c(SwsContext *c, const int16_t *chrFilter, int chrFilterSize, const int16_t **chrUSrc, const int16_t **chrVSrc, uint8_t *dest8, int chrDstW)
Definition: output.c:183

SwsContext
Definition: swscale_internal.h:280

AVComponentDescriptor::depth
int depth
Number of bits in the component.
Definition: pixdesc.h:58

AV_PIX_FMT_GBRAP16LE
planar GBRA 4:4:4:4 64bpp, little-endian
Definition: pixfmt.h:213

YUV2PACKEDWRAPPER
#define YUV2PACKEDWRAPPER(name, base, ext, fmt)
Definition: output.c:609

SwsContext::flags
int flags
Flags passed by the user to select scaler algorithm, optimizations, subsampling, etc...
Definition: swscale_internal.h:395

AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:60

isNBPS
static av_always_inline int isNBPS(enum AVPixelFormat pix_fmt)
Definition: swscale_internal.h:651

SWS_DITHER_A_DITHER
Definition: swscale_internal.h:70

AV_PIX_FMT_GBRP10LE
planar GBR 4:4:4 30bpp, little-endian
Definition: pixfmt.h:169

AV_PIX_FMT_RGBA64LE
packed RGBA 16:16:16:16, 64bpp, 16R, 16G, 16B, 16A, the 2-byte value for each R/G/B/A component is stored as little-endian
Definition: pixfmt.h:202

AV_PIX_FMT_AYUV64LE
packed AYUV 4:4:4,64bpp (1 Cr & Cb sample per 1x1 Y & A samples), little-endian
Definition: pixfmt.h:275

V
#define V
Definition: avdct.c:30