doxygen/4.1/vf__fspp_8c_source.html

 /*

  * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>

  * Copyright (C) 2005 Nikolaj Poroshin <porosh3@psu.ru>

  * Copyright (c) 2014 Arwa Arif <arwaarif1994@gmail.com>

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 2 of the License, or

  * (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  * GNU General Public License for more details.

  *

  * You should have received a copy of the GNU General Public License along

  * with FFmpeg; if not, write to the Free Software Foundation, Inc.,

  * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.

  */


 /**

  * @file

  * Fast Simple Post-processing filter

  * This implementation is based on an algorithm described in

  * "Aria Nosratinia Embedded Post-Processing for

  * Enhancement of Compressed Images (1999)"

  * (http://www.utdallas.edu/~aria/papers/vlsisp99.pdf)

  * Further, with splitting (I)DCT into horizontal/vertical passes, one of

  * them can be performed once per block, not per pixel. This allows for much

  * higher speed.

  *

  * Originally written by Michael Niedermayer and Nikolaj for the MPlayer

  * project, and ported by Arwa Arif for FFmpeg.

  */


 #include "libavutil/avassert.h"

 #include "libavutil/imgutils.h"

 #include "libavutil/opt.h"

 #include "libavutil/pixdesc.h"

 #include "internal.h"

 #include "vf_fspp.h"


 /* Byte offset of an option field inside the filter's private context. */
 #define OFFSET(x) offsetof(FSPPContext, x)

 /* Flags shared by every option in the table below. */
 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM

 /*
  * User-visible options of the fspp filter.
  *
  *  - quality:       stored in log2_count; default 4, range 4..MAX_LEVEL.
  *  - qp:            stored in qp; default 0, range 0..64. A non-zero value is
  *                   used as a fixed quantizer instead of the per-frame QP table.
  *  - strength:      stored in strength; default 0, range -15..32.
  *  - use_bframe_qp: boolean stored in use_bframe_qp; default 0.
  */
 static const AVOption fspp_options[] = {

     { "quality",       "set quality",                          OFFSET(log2_count),    AV_OPT_TYPE_INT, {.i64 = 4},   4, MAX_LEVEL, FLAGS },

     { "qp",            "force a constant quantizer parameter", OFFSET(qp),            AV_OPT_TYPE_INT, {.i64 = 0},   0, 64,        FLAGS },

     { "strength",      "set filter strength",                  OFFSET(strength),      AV_OPT_TYPE_INT, {.i64 = 0}, -15, 32,        FLAGS },

     { "use_bframe_qp", "use B-frames' QP",                     OFFSET(use_bframe_qp), AV_OPT_TYPE_BOOL,{.i64 = 0},   0, 1,         FLAGS },

     { NULL }

 };


 /* Defines fspp_class, which the filter definition references as priv_class. */
 AVFILTER_DEFINE_CLASS(fspp);


 /*
  * 8x8 dither matrix with entries in the range 0..63, 32-byte aligned.
  * The store_slice functions pick one row per output line and add the
  * (down-shifted) entry to each accumulated sample before the final shift.
  */
 DECLARE_ALIGNED(32, static const uint8_t, dither)[8][8] = {

     {  0,  48,  12,  60,   3,  51,  15,  63, },

     { 32,  16,  44,  28,  35,  19,  47,  31, },

     {  8,  56,   4,  52,  11,  59,   7,  55, },

     { 40,  24,  36,  20,  43,  27,  39,  23, },

     {  2,  50,  14,  62,   1,  49,  13,  61, },

     { 34,  18,  46,  30,  33,  17,  45,  29, },

     { 10,  58,   6,  54,   9,  57,   5,  53, },

     { 42,  26,  38,  22,  41,  25,  37,  21, },

 };


 /*
  * Base threshold for each of the 64 coefficients of an 8x8 block.
  * filter_frame() rescales these by (16 + strength) / 71 before use.
  */
 static const short custom_threshold[64] = {

 // The values (maximum is 296) must not be too high:

 // large values make the result depend too strongly on the quantizer,

 // or may overflow (to be checked), which shows up as flashing.

      71, 296, 295, 237,  71,  40,  38,  19,

     245, 193, 185, 121, 102,  73,  53,  27,

     158, 129, 141, 107,  97,  73,  50,  26,

     102, 116, 109,  98,  82,  66,  45,  23,

      71,  94,  95,  81,  70,  56,  38,  20,

      56,  77,  74,  66,  56,  44,  30,  15,

      38,  53,  50,  45,  38,  30,  21,  11,

      20,  27,  26,  23,  20,  15,  11,   5

 };


 //This func reads from 1 slice, 1 and clears 0 & 1

 static void store_slice_c(uint8_t *dst, int16_t *src,

                           ptrdiff_t dst_stride, ptrdiff_t src_stride,

                           ptrdiff_t width, ptrdiff_t height, ptrdiff_t log2_scale)

 {

     int y, x;

 #define STORE(pos)                                                             \

     temp = (src[x + pos] + (d[pos] >> log2_scale)) >> (6 - log2_scale);        \

     src[x + pos] = src[x + pos - 8 * src_stride] = 0;                          \

     if (temp & 0x100) temp = ~(temp >> 31);                                    \

     dst[x + pos] = temp;


     for (y = 0; y < height; y++) {

         const uint8_t *d = dither[y];

         for (x = 0; x < width; x += 8) {

             int temp;

             STORE(0);

             STORE(1);

             STORE(2);

             STORE(3);

             STORE(4);

             STORE(5);

             STORE(6);

             STORE(7);

         }

         src += src_stride;

         dst += dst_stride;

     }

 }


 //This func reads from 2 slices, 0 & 2  and clears 2-nd

 static void store_slice2_c(uint8_t *dst, int16_t *src,

                            ptrdiff_t dst_stride, ptrdiff_t src_stride,

                            ptrdiff_t width, ptrdiff_t height, ptrdiff_t log2_scale)

 {

     int y, x;

 #define STORE2(pos)                                                                                       \

     temp = (src[x + pos] + src[x + pos + 16 * src_stride] + (d[pos] >> log2_scale)) >> (6 - log2_scale);  \

     src[x + pos + 16 * src_stride] = 0;                                                                   \

     if (temp & 0x100) temp = ~(temp >> 31);                                                               \

     dst[x + pos] = temp;


     for (y = 0; y < height; y++) {

         const uint8_t *d = dither[y];

         for (x = 0; x < width; x += 8) {

             int temp;

             STORE2(0);

             STORE2(1);

             STORE2(2);

             STORE2(3);

             STORE2(4);

             STORE2(5);

             STORE2(6);

             STORE2(7);

         }

         src += src_stride;

         dst += dst_stride;

     }

 }


 /**
  * Scale a 64-entry threshold matrix by a quantizer value.
  *
  * @param thr_adr_noq unscaled thresholds (64 entries, read only)
  * @param thr_adr     receives q * thr_adr_noq[i] for each of the 64 entries
  * @param q           multiplier
  */
 static void mul_thrmat_c(int16_t *thr_adr_noq, int16_t *thr_adr, int q)
 {
     const int16_t *in        = thr_adr_noq;
     int16_t       *out       = thr_adr;
     int16_t *const out_end   = thr_adr + 64;

     while (out < out_end)
         *out++ = q * (*in++);
 }


 /**
  * Run the post-processing filter on a single plane.
  *
  * The plane is copied into the scratch buffer p->src with an 8-sample
  * mirrored border, transformed line by line through the row_fdct /
  * column_fidct / row_idct callbacks into the accumulator p->temp, and
  * written to dst in groups of up to 8 rows through store_slice /
  * store_slice2.
  *
  * @param p          filter context (provides scratch buffers, callbacks,
  *                   thresholds and options)
  * @param dst        destination plane; nothing is done if NULL
  * @param src        source plane; nothing is done if NULL
  * @param dst_stride distance between destination rows, in bytes
  * @param src_stride distance between source rows, in bytes
  * @param width      plane width in samples
  * @param height     plane height in rows
  * @param qp_store   quantizer table; only read when p->qp is 0
  * @param qp_stride  distance between rows of qp_store
  * @param is_luma    non-zero for the luma plane: selects p->temp_stride as
  *                   scratch stride and disables the chroma shifts used for
  *                   the quantizer lookup
  */
 static void filter(FSPPContext *p, uint8_t *dst, uint8_t *src,

                    int dst_stride, int src_stride,

                    int width, int height,

                    uint8_t *qp_store, int qp_stride, int is_luma)

 {

     int x, x0, y, es, qy, t;


     const int stride = is_luma ? p->temp_stride : (width + 16);

     /* vertical step between processed lines, derived from the quality option */
     const int step = 6 - p->log2_count;

     /* shifts that map a sample position to a quantizer table position */
     const int qpsh = 4 - p->hsub * !is_luma;

     const int qpsv = 4 - p->vsub * !is_luma;


     /* one int32 array holding two int16 work areas: block (first half)
      * and block3 (second half) */
     DECLARE_ALIGNED(32, int32_t, block_align)[4 * 8 * BLOCKSZ + 4 * 8 * BLOCKSZ];

     int16_t *block  = (int16_t *)block_align;

     int16_t *block3 = (int16_t *)(block_align + 4 * 8 * BLOCKSZ);


     memset(block3, 0, 4 * 8 * BLOCKSZ);


     if (!src || !dst) return;


     /* copy the plane into p->src, offset by 8 rows and 8 columns, and mirror
      * 8 samples across the left and right edges of every row */
     for (y = 0; y < height; y++) {

         int index = 8 + 8 * stride + y * stride;

         memcpy(p->src + index, src + y * src_stride, width);

         for (x = 0; x < 8; x++) {

             p->src[index         - x - 1] = p->src[index +         x    ];

             p->src[index + width + x    ] = p->src[index + width - x - 1];

         }

     }


     /* mirror 8 rows above the first and below the last image row */
     for (y = 0; y < 8; y++) {

         memcpy(p->src + (     7 - y    ) * stride, p->src + (     y + 8    ) * stride, stride);

         memcpy(p->src + (height + 8 + y) * stride, p->src + (height - y + 7) * stride, stride);

     }

     //FIXME (try edge emu)


     /* clear rows 8..23 of the accumulator before the first use */
     for (y = 8; y < 24; y++)

         memset(p->temp + 8 + y * stride, 0, width * sizeof(int16_t));


     for (y = step; y < height + 8; y += step) {    //step= 1,2

         const int y1 = y - 8 + step;                 //l5-7  l4-6;

         /* quantizer row for this line: y - 4 clamped to [0, height - 1] */
         qy = y - 4;


         if (qy > height - 1) qy = height - 1;

         if (qy < 0) qy = 0;


         qy = (qy >> qpsv) * qp_stride;

         p->row_fdct(block, p->src + y * stride + 2 - (y&1), stride, 2);


         /* process the line in chunks of (BLOCKSZ - 1) blocks of 8 columns */
         for (x0 = 0; x0 < width + 8 - 8 * (BLOCKSZ - 1); x0 += 8 * (BLOCKSZ - 1)) {

             p->row_fdct(block + 8 * 8, p->src + y * stride + 8 + x0 + 2 - (y&1), stride, 2 * (BLOCKSZ - 1));


             /* fixed quantizer: the threshold matrix is already scaled, so the
              * whole chunk is processed in one call */
             if (p->qp)

                 p->column_fidct((int16_t *)(&p->threshold_mtx[0]), block + 0 * 8, block3 + 0 * 8, 8 * (BLOCKSZ - 1)); //yes, this is a HOTSPOT

             else

                 /* per-block quantizer: look it up and rescale the threshold
                  * matrix only when the value changes */
                 for (x = 0; x < 8 * (BLOCKSZ - 1); x += 8) {

                     t = x + x0 - 2;                    //correct t=x+x0-2-(y&1), but its the same


                     if (t < 0) t = 0;                   //t always < width-2


                     t = qp_store[qy + (t >> qpsh)];

                     t = ff_norm_qscale(t, p->qscale_type);


                     if (t != p->prev_q) p->prev_q = t, p->mul_thrmat((int16_t *)(&p->threshold_mtx_noq[0]), (int16_t *)(&p->threshold_mtx[0]), t);

                     p->column_fidct((int16_t *)(&p->threshold_mtx[0]), block + x * 8, block3 + x * 8, 8); //yes, this is a HOTSPOT

                 }

             p->row_idct(block3 + 0 * 8, p->temp + (y & 15) * stride + x0 + 2 - (y & 1), stride, 2 * (BLOCKSZ - 1));

             /* carry the trailing coefficients over to the start of the work
              * areas for the next chunk */
             memmove(block,  block  + (BLOCKSZ - 1) * 64, 8 * 8 * sizeof(int16_t)); //cycling

             memmove(block3, block3 + (BLOCKSZ - 1) * 64, 6 * 8 * sizeof(int16_t));

         }


         /* remaining columns of the line after the last full chunk */
         es = width + 8 - x0; //  8, ...

         if (es > 8)

             p->row_fdct(block + 8 * 8, p->src + y * stride + 8 + x0 + 2 - (y & 1), stride, (es - 4) >> 2);


         p->column_fidct((int16_t *)(&p->threshold_mtx[0]), block, block3, es&(~1));

         if (es > 3)

             p->row_idct(block3 + 0 * 8, p->temp + (y & 15) * stride + x0 + 2 - (y & 1), stride, es >> 2);


         /* when y1 reaches a non-zero multiple of 8, write the 8 rows ending
          * there to dst; bit 3 of y1 selects which store function is used */
         if (!(y1 & 7) && y1) {

             if (y1 & 8)

                 p->store_slice(dst + (y1 - 8) * dst_stride, p->temp + 8 + 8 * stride,

                                dst_stride, stride, width, 8, 5 - p->log2_count);

             else

                 p->store_slice2(dst + (y1 - 8) * dst_stride, p->temp + 8 + 0 * stride,

                                 dst_stride, stride, width, 8, 5 - p->log2_count);

         }

     }


     /* write the final, partial group of rows (fewer than 8) */
     if (y & 7) {  // height % 8 != 0

         if (y & 8)

             p->store_slice(dst + ((y - 8) & ~7) * dst_stride, p->temp + 8 + 8 * stride,

                            dst_stride, stride, width, y&7, 5 - p->log2_count);

         else

             p->store_slice2(dst + ((y - 8) & ~7) * dst_stride, p->temp + 8 + 0 * stride,

                             dst_stride, stride, width, y&7, 5 - p->log2_count);

     }

 }


 /**
  * Column pass: forward DCT, thresholding and inverse DCT in a single sweep.
  *
  * For every processed column the 8 input coefficients (spaced DCTSIZE apart)
  * are transformed, each frequency is passed through the THRESHOLD() macro
  * with the matching entry of the threshold matrix, and the inverse transform
  * is written to output. Output rows 0..5 are accumulated (+=) while rows 6
  * and 7 are overwritten (=).
  *
  * Scaling by powers of two is written as a multiplication rather than a left
  * shift, because the operands can be negative and left-shifting a negative
  * signed value is undefined behaviour in C.
  *
  * @param thr_adr threshold matrix, read as 8 rows of 8 int16_t values
  * @param data    input coefficients
  * @param output  output workspace (read and written)
  * @param cnt     loop budget: each outer iteration consumes 2, handles
  *                DCTSIZE consecutive columns and then skips 8 more positions
  */
 static void column_fidct_c(int16_t *thr_adr, int16_t *data, int16_t *output, int cnt)
 {
     int_simd16_t tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
     int_simd16_t tmp10, tmp11, tmp12, tmp13;
     int_simd16_t z1, z2, z3, z4, z5, z10, z11, z12, z13;
     int_simd16_t d0, d1, d2, d3, d4, d5, d6, d7;

     int16_t *dataptr;
     int16_t *wsptr;
     int16_t *threshold;
     int ctr;

     dataptr = data;
     wsptr = output;

     for (; cnt > 0; cnt -= 2) { //start positions
         threshold = thr_adr; //threshold_mtx
         for (ctr = DCTSIZE; ctr > 0; ctr--) {
             // Process columns from input, add to output.
             tmp0 = dataptr[DCTSIZE * 0] + dataptr[DCTSIZE * 7];
             tmp7 = dataptr[DCTSIZE * 0] - dataptr[DCTSIZE * 7];

             tmp1 = dataptr[DCTSIZE * 1] + dataptr[DCTSIZE * 6];
             tmp6 = dataptr[DCTSIZE * 1] - dataptr[DCTSIZE * 6];

             tmp2 = dataptr[DCTSIZE * 2] + dataptr[DCTSIZE * 5];
             tmp5 = dataptr[DCTSIZE * 2] - dataptr[DCTSIZE * 5];

             tmp3 = dataptr[DCTSIZE * 3] + dataptr[DCTSIZE * 4];
             tmp4 = dataptr[DCTSIZE * 3] - dataptr[DCTSIZE * 4];

             // Even part of FDCT

             tmp10 = tmp0 + tmp3;
             tmp13 = tmp0 - tmp3;
             tmp11 = tmp1 + tmp2;
             tmp12 = tmp1 - tmp2;

             d0 = tmp10 + tmp11;
             d4 = tmp10 - tmp11;

             z1 = MULTIPLY16H((tmp12 + tmp13) * 4, FIX_0_707106781);
             d2 = tmp13 + z1;
             d6 = tmp13 - z1;

             // Even part of IDCT

             THRESHOLD(tmp0, d0, threshold[0 * 8]);
             THRESHOLD(tmp1, d2, threshold[2 * 8]);
             THRESHOLD(tmp2, d4, threshold[4 * 8]);
             THRESHOLD(tmp3, d6, threshold[6 * 8]);
             tmp0 += 2;
             tmp10 = (tmp0 + tmp2) >> 2;
             tmp11 = (tmp0 - tmp2) >> 2;

             tmp13 = (tmp1 + tmp3) >>2; //+2 !  (psnr decides)
             tmp12 = MULTIPLY16H((tmp1 - tmp3), FIX_1_414213562_A) - tmp13; //<<2

             tmp0 = tmp10 + tmp13; //->temps
             tmp3 = tmp10 - tmp13; //->temps
             tmp1 = tmp11 + tmp12; //->temps
             tmp2 = tmp11 - tmp12; //->temps

             // Odd part of FDCT

             tmp10 = tmp4 + tmp5;
             tmp11 = tmp5 + tmp6;
             tmp12 = tmp6 + tmp7;

             z5 = MULTIPLY16H((tmp10 - tmp12) * 4, FIX_0_382683433);
             z2 = MULTIPLY16H(tmp10 * 4, FIX_0_541196100) + z5;
             z4 = MULTIPLY16H(tmp12 * 4, FIX_1_306562965) + z5;
             z3 = MULTIPLY16H(tmp11 * 4, FIX_0_707106781);

             z11 = tmp7 + z3;
             z13 = tmp7 - z3;

             d5 = z13 + z2;
             d3 = z13 - z2;
             d1 = z11 + z4;
             d7 = z11 - z4;

             // Odd part of IDCT

             THRESHOLD(tmp4, d1, threshold[1 * 8]);
             THRESHOLD(tmp5, d3, threshold[3 * 8]);
             THRESHOLD(tmp6, d5, threshold[5 * 8]);
             THRESHOLD(tmp7, d7, threshold[7 * 8]);

             //Simd version uses here a shortcut for the tmp5,tmp6,tmp7 == 0
             z13 = tmp6 + tmp5;
             z10 = (tmp6 - tmp5) * 2;
             z11 = tmp4 + tmp7;
             z12 = (tmp4 - tmp7) * 2;

             tmp7  = (z11 + z13) >> 2; //+2 !
             tmp11 = MULTIPLY16H((z11 - z13) * 2, FIX_1_414213562);
             z5    = MULTIPLY16H(z10 + z12,        FIX_1_847759065);
             tmp10 = MULTIPLY16H(z12,              FIX_1_082392200) - z5;
             tmp12 = MULTIPLY16H(z10,              FIX_2_613125930) + z5; // - !!

             tmp6 = tmp12 - tmp7;
             tmp5 = tmp11 - tmp6;
             tmp4 = tmp10 + tmp5;

             // rows 0..5 accumulate, rows 6 and 7 are written fresh
             wsptr[DCTSIZE * 0] +=  (tmp0 + tmp7);
             wsptr[DCTSIZE * 1] +=  (tmp1 + tmp6);
             wsptr[DCTSIZE * 2] +=  (tmp2 + tmp5);
             wsptr[DCTSIZE * 3] +=  (tmp3 - tmp4);
             wsptr[DCTSIZE * 4] +=  (tmp3 + tmp4);
             wsptr[DCTSIZE * 5] +=  (tmp2 - tmp5);
             wsptr[DCTSIZE * 6]  =  (tmp1 - tmp6);
             wsptr[DCTSIZE * 7]  =  (tmp0 - tmp7);
             //
             dataptr++; //next column
             wsptr++;
             threshold++;
         }
         dataptr += 8; //skip each second start pos
         wsptr   += 8;
     }
 }


 /**
  * Row pass of the inverse DCT.
  *
  * Reads groups of DCTSIZE coefficients from workspace, transforms each
  * group and adds the descaled result to 8 output samples spaced
  * output_stride apart; the output pointer then moves on by one sample.
  *
  * Scaling by powers of two is written as a multiplication rather than a left
  * shift, because the operands can be negative and left-shifting a negative
  * signed value is undefined behaviour in C.
  *
  * @param workspace     input coefficients, DCTSIZE per processed position
  * @param output_adr    first output sample (accumulated into)
  * @param output_stride distance between the 8 outputs of one position
  * @param cnt           number of positions to process, divided by 4
  */
 static void row_idct_c(int16_t *workspace, int16_t *output_adr, ptrdiff_t output_stride, int cnt)
 {
     int_simd16_t tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
     int_simd16_t tmp10, tmp11, tmp12, tmp13;
     int_simd16_t z5, z10, z11, z12, z13;
     int16_t *outptr;
     int16_t *wsptr;

     cnt *= 4;
     wsptr = workspace;
     outptr = output_adr;
     for (; cnt > 0; cnt--) {
         // Even part
         //Simd version reads 4x4 block and transposes it
         tmp10 = wsptr[2] +  wsptr[3];
         tmp11 = wsptr[2] -  wsptr[3];

         tmp13 = wsptr[0] +  wsptr[1];
         // multiply first, scale afterwards: this order avoids overflow
         tmp12 = (MULTIPLY16H(wsptr[0] - wsptr[1], FIX_1_414213562_A) * 4) - tmp13;

         tmp0 = tmp10 + tmp13; //->temps
         tmp3 = tmp10 - tmp13; //->temps
         tmp1 = tmp11 + tmp12;
         tmp2 = tmp11 - tmp12;

         // Odd part
         //Also transpose, with previous:
         // ---- ----      ||||
         // ---- ---- idct ||||
         // ---- ---- ---> ||||
         // ---- ----      ||||
         z13 = wsptr[4] + wsptr[5];
         z10 = wsptr[4] - wsptr[5];
         z11 = wsptr[6] + wsptr[7];
         z12 = wsptr[6] - wsptr[7];

         tmp7 = z11 + z13;
         tmp11 = MULTIPLY16H(z11 - z13, FIX_1_414213562);

         z5 =    MULTIPLY16H(z10 + z12, FIX_1_847759065);
         tmp10 = MULTIPLY16H(z12,       FIX_1_082392200) - z5;
         tmp12 = MULTIPLY16H(z10,       FIX_2_613125930) + z5; // - FIX_

         tmp6 = tmp12 * 8 - tmp7;
         tmp5 = tmp11 * 8 - tmp6;
         tmp4 = tmp10 * 8 + tmp5;

         // Final output stage: descale and write column
         outptr[0 * output_stride] += DESCALE(tmp0 + tmp7, 3);
         outptr[1 * output_stride] += DESCALE(tmp1 + tmp6, 3);
         outptr[2 * output_stride] += DESCALE(tmp2 + tmp5, 3);
         outptr[3 * output_stride] += DESCALE(tmp3 - tmp4, 3);
         outptr[4 * output_stride] += DESCALE(tmp3 + tmp4, 3);
         outptr[5 * output_stride] += DESCALE(tmp2 - tmp5, 3);
         outptr[6 * output_stride] += DESCALE(tmp1 - tmp6, 3); //no += ?
         outptr[7 * output_stride] += DESCALE(tmp0 - tmp7, 3); //no += ?
         outptr++;

         wsptr += DCTSIZE;       // advance pointer to next row
     }
 }


 /**
  * Row pass of the forward DCT.
  *
  * For each processed position, 8 pixels spaced line_size apart are
  * transformed and the 8 resulting coefficients are stored consecutively in
  * data; the pixel pointer then moves on by one byte.
  *
  * Scaling by powers of two is written as a multiplication rather than a left
  * shift, because the pixel differences can be negative and left-shifting a
  * negative signed value is undefined behaviour in C.
  *
  * @param data      output coefficients, DCTSIZE per processed position
  * @param pixels    first input pixel
  * @param line_size distance between the 8 input pixels of one position
  * @param cnt       number of positions to process, divided by 4
  */
 static void row_fdct_c(int16_t *data, const uint8_t *pixels, ptrdiff_t line_size, int cnt)
 {
     int_simd16_t tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
     int_simd16_t tmp10, tmp11, tmp12, tmp13;
     int_simd16_t z1, z2, z3, z4, z5, z11, z13;
     int16_t *dataptr;

     cnt *= 4;
     // Pass 1: process rows.

     dataptr = data;
     for (; cnt > 0; cnt--) {
         tmp0 = pixels[line_size * 0] + pixels[line_size * 7];
         tmp7 = pixels[line_size * 0] - pixels[line_size * 7];
         tmp1 = pixels[line_size * 1] + pixels[line_size * 6];
         tmp6 = pixels[line_size * 1] - pixels[line_size * 6];
         tmp2 = pixels[line_size * 2] + pixels[line_size * 5];
         tmp5 = pixels[line_size * 2] - pixels[line_size * 5];
         tmp3 = pixels[line_size * 3] + pixels[line_size * 4];
         tmp4 = pixels[line_size * 3] - pixels[line_size * 4];

         // Even part

         tmp10 = tmp0 + tmp3;
         tmp13 = tmp0 - tmp3;
         tmp11 = tmp1 + tmp2;
         tmp12 = tmp1 - tmp2;
         // Even coefficients are written first. This gives a different column
         // order in column_fidct(), but columns are processed independently
         // there, so this is fine. row_idct() later reads the columns in the
         // same order.
         dataptr[2] = tmp10 + tmp11;
         dataptr[3] = tmp10 - tmp11;

         z1 = MULTIPLY16H((tmp12 + tmp13) * 4, FIX_0_707106781);
         dataptr[0] = tmp13 + z1;
         dataptr[1] = tmp13 - z1;

         // Odd part

         tmp10 = (tmp4 + tmp5) * 4;
         tmp11 = (tmp5 + tmp6) * 4;
         tmp12 = (tmp6 + tmp7) * 4;

         z5 = MULTIPLY16H(tmp10 - tmp12, FIX_0_382683433);
         z2 = MULTIPLY16H(tmp10,         FIX_0_541196100) + z5;
         z4 = MULTIPLY16H(tmp12,         FIX_1_306562965) + z5;
         z3 = MULTIPLY16H(tmp11,         FIX_0_707106781);

         z11 = tmp7 + z3;
         z13 = tmp7 - z3;

         dataptr[4] = z13 + z2;
         dataptr[5] = z13 - z2;
         dataptr[6] = z11 + z4;
         dataptr[7] = z11 - z4;

         pixels++;               // advance pointer to next column
         dataptr += DCTSIZE;
     }
 }


 /**
  * Declare the pixel formats accepted by the filter.
  *
  * @return the result of ff_set_common_formats(), or AVERROR(ENOMEM) if the
  *         format list could not be created
  */
 static int query_formats(AVFilterContext *ctx)
 {
     static const enum AVPixelFormat supported_fmts[] = {
         AV_PIX_FMT_YUV444P,  AV_PIX_FMT_YUV422P,
         AV_PIX_FMT_YUV420P,  AV_PIX_FMT_YUV411P,
         AV_PIX_FMT_YUV410P,  AV_PIX_FMT_YUV440P,
         AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_YUVJ422P,
         AV_PIX_FMT_YUVJ420P, AV_PIX_FMT_YUVJ440P,
         AV_PIX_FMT_GBRP, AV_PIX_FMT_GRAY8,
         AV_PIX_FMT_NONE
     };
     AVFilterFormats *formats = ff_make_format_list(supported_fmts);

     return formats ? ff_set_common_formats(ctx, formats) : AVERROR(ENOMEM);
 }


 /**
  * Configure the filter for the negotiated input link.
  *
  * Records the chroma subsampling shifts of the input format, allocates the
  * two scratch buffers (dimensions padded by 16 and rounded up to a multiple
  * of 16), allocates the table that holds the QP values of the last
  * non-B-frame when it is needed, and installs the C implementations of the
  * DSP callbacks (optionally replaced by x86 versions).
  *
  * @return 0 on success, AVERROR(ENOMEM) if an allocation fails
  */
 static int config_input(AVFilterLink *inlink)
 {
     FSPPContext *s = inlink->dst->priv;
     const AVPixFmtDescriptor *pix_desc = av_pix_fmt_desc_get(inlink->format);
     const int padded_h = FFALIGN(inlink->h + 16, 16);

     s->hsub = pix_desc->log2_chroma_w;
     s->vsub = pix_desc->log2_chroma_h;

     s->temp_stride = FFALIGN(inlink->w + 16, 16);
     s->temp = av_malloc_array(s->temp_stride, padded_h * sizeof(*s->temp));
     s->src  = av_malloc_array(s->temp_stride, padded_h * sizeof(*s->src));
     if (!(s->temp && s->src))
         return AVERROR(ENOMEM);

     /* the saved QP table is only needed when neither a fixed quantizer nor
      * the B-frame quantizers are used */
     if (!(s->use_bframe_qp || s->qp)) {
         s->non_b_qp_alloc_size = AV_CEIL_RSHIFT(inlink->w, 4) * AV_CEIL_RSHIFT(inlink->h, 4);
         s->non_b_qp_table = av_calloc(s->non_b_qp_alloc_size, sizeof(*s->non_b_qp_table));
         if (!s->non_b_qp_table)
             return AVERROR(ENOMEM);
     }

     s->store_slice  = store_slice_c;
     s->store_slice2 = store_slice2_c;
     s->mul_thrmat   = mul_thrmat_c;
     s->column_fidct = column_fidct_c;
     s->row_idct     = row_idct_c;
     s->row_fdct     = row_fdct_c;

     if (ARCH_X86)
         ff_fspp_init_x86(s);

     return 0;
 }


 /**
  * Filter one input frame and pass the result to the output link.
  *
  * The threshold matrix is rebuilt from custom_threshold[] and the strength
  * option on every call. When no fixed quantizer is configured, the frame's
  * QP table is fetched and, unless use_bframe_qp is set, a copy of the table
  * of the last non-B-frame is kept and used instead. The three planes are
  * then processed by filter(), in place when the frame is writable and its
  * dimensions are multiples of 8, otherwise into a newly allocated frame.
  *
  * Ownership of in is taken in every case: it is either forwarded, or freed
  * on all error paths and when a separate output frame is used.
  *
  * @param inlink input link the frame arrived on
  * @param in     input frame
  * @return the result of ff_filter_frame() on success, a negative AVERROR
  *         code on failure
  */
 static int filter_frame(AVFilterLink *inlink, AVFrame *in)
 {
     AVFilterContext *ctx = inlink->dst;
     FSPPContext *fspp = ctx->priv;
     AVFilterLink *outlink = ctx->outputs[0];
     AVFrame *out = in;

     int qp_stride = 0;
     uint8_t *qp_table = NULL;
     int i, bias;
     int custom_threshold_m[64];

     bias = (1 << 4) + fspp->strength;

     for (i = 0; i < 64; i++) //FIXME: tune custom_threshold[] and remove this !
         custom_threshold_m[i] = (int)(custom_threshold[i] * (bias / 71.0) + 0.5);

     /* pack each row of 8 thresholds into two 64-bit words, four 16-bit
      * values per word, in the column order 2,6,0,4 and 5,3,1,7 */
     for (i = 0; i < 8; i++) {
         fspp->threshold_mtx_noq[2 * i] = (uint64_t)custom_threshold_m[i * 8 + 2]
                                       |(((uint64_t)custom_threshold_m[i * 8 + 6]) << 16)
                                       |(((uint64_t)custom_threshold_m[i * 8 + 0]) << 32)
                                       |(((uint64_t)custom_threshold_m[i * 8 + 4]) << 48);

         fspp->threshold_mtx_noq[2 * i + 1] = (uint64_t)custom_threshold_m[i * 8 + 5]
                                           |(((uint64_t)custom_threshold_m[i * 8 + 3]) << 16)
                                           |(((uint64_t)custom_threshold_m[i * 8 + 1]) << 32)
                                           |(((uint64_t)custom_threshold_m[i * 8 + 7]) << 48);
     }

     /* fixed quantizer: scale the threshold matrix once, up front */
     if (fspp->qp) {
         fspp->prev_q = fspp->qp;
         fspp->mul_thrmat((int16_t *)(&fspp->threshold_mtx_noq[0]), (int16_t *)(&fspp->threshold_mtx[0]), fspp->qp);
     }

     /* if we are not in a constant user quantizer mode and we don't want to use
      * the quantizers from the B-frames (B-frames often have a higher QP), we
      * need to save the qp table from the last non B-frame; this is what the
      * following code block does */
     if (!fspp->qp) {
         qp_table = av_frame_get_qp_table(in, &qp_stride, &fspp->qscale_type);

         if (qp_table && !fspp->use_bframe_qp && in->pict_type != AV_PICTURE_TYPE_B) {
             int w, h;

             /* if the qp stride is not set, it means the QP are only defined on
              * a line basis */
             if (!qp_stride) {
                 w = AV_CEIL_RSHIFT(inlink->w, 4);
                 h = 1;
             } else {
                 w = qp_stride;
                 h = AV_CEIL_RSHIFT(inlink->h, 4);
             }
             if (w * h > fspp->non_b_qp_alloc_size) {
                 int ret = av_reallocp_array(&fspp->non_b_qp_table, w, h);
                 if (ret < 0) {
                     fspp->non_b_qp_alloc_size = 0;
                     /* the frame is owned by this function and must not leak
                      * on the error path */
                     av_frame_free(&in);
                     return ret;
                 }
                 fspp->non_b_qp_alloc_size = w * h;
             }

             av_assert0(w * h <= fspp->non_b_qp_alloc_size);
             memcpy(fspp->non_b_qp_table, qp_table, w * h);
         }
     }

     if (fspp->log2_count && !ctx->is_disabled) {
         if (!fspp->use_bframe_qp && fspp->non_b_qp_table)
             qp_table = fspp->non_b_qp_table;

         if (qp_table || fspp->qp) {
             const int cw = AV_CEIL_RSHIFT(inlink->w, fspp->hsub);
             const int ch = AV_CEIL_RSHIFT(inlink->h, fspp->vsub);

             /* get a new frame if in-place is not possible or if the dimensions
              * are not multiple of 8 */
             if (!av_frame_is_writable(in) || (inlink->w & 7) || (inlink->h & 7)) {
                 const int aligned_w = FFALIGN(inlink->w, 8);
                 const int aligned_h = FFALIGN(inlink->h, 8);

                 out = ff_get_video_buffer(outlink, aligned_w, aligned_h);
                 if (!out) {
                     av_frame_free(&in);
                     return AVERROR(ENOMEM);
                 }
                 av_frame_copy_props(out, in);
                 out->width = in->width;
                 out->height = in->height;
             }

             /* filter() returns immediately for planes whose pointer is NULL */
             filter(fspp, out->data[0], in->data[0], out->linesize[0], in->linesize[0],
                    inlink->w, inlink->h, qp_table, qp_stride, 1);
             filter(fspp, out->data[1], in->data[1], out->linesize[1], in->linesize[1],
                    cw,        ch,        qp_table, qp_stride, 0);
             filter(fspp, out->data[2], in->data[2], out->linesize[2], in->linesize[2],
                    cw,        ch,        qp_table, qp_stride, 0);
             emms_c();
         }
     }

     if (in != out) {
         /* a fourth plane, if present, is copied unfiltered */
         if (in->data[3])
             av_image_copy_plane(out->data[3], out->linesize[3],
                                 in ->data[3], in ->linesize[3],
                                 inlink->w, inlink->h);
         av_frame_free(&in);
     }
     return ff_filter_frame(outlink, out);
 }


 /**
  * Release the buffers owned by the filter context: the two scratch
  * buffers and the saved QP table.
  */
 static av_cold void uninit(AVFilterContext *ctx)
 {
     FSPPContext *s = ctx->priv;

     av_freep(&s->non_b_qp_table);
     av_freep(&s->src);
     av_freep(&s->temp);
 }


 /*
  * Input pads: a single video pad named "default". config_input is
  * registered as its config_props callback and filter_frame as its
  * frame callback. The list is terminated by a NULL entry.
  */
 static const AVFilterPad fspp_inputs[] = {

     {

         .name         = "default",

         .type         = AVMEDIA_TYPE_VIDEO,

         .config_props = config_input,

         .filter_frame = filter_frame,

     },

     { NULL }

 };


 /*
  * Output pads: a single video pad named "default" with no callbacks.
  * The list is terminated by a NULL entry.
  */
 static const AVFilterPad fspp_outputs[] = {

     {

         .name = "default",

         .type = AVMEDIA_TYPE_VIDEO,

     },

     { NULL }

 };


 /*
  * Filter definition for "fspp". It ties together the private context size,
  * the option class, the format query, the pads and the uninit callback.
  * The flag AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL is set; filter_frame()
  * checks ctx->is_disabled itself and skips the filtering when it is set.
  */
 AVFilter ff_vf_fspp = {

     .name            = "fspp",

     .description     = NULL_IF_CONFIG_SMALL("Apply Fast Simple Post-processing filter."),

     .priv_size       = sizeof(FSPPContext),

     .uninit          = uninit,

     .query_formats   = query_formats,

     .inputs          = fspp_inputs,

     .outputs         = fspp_outputs,

     .priv_class      = &fspp_class,

     .flags           = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,

 };

FIX_1_414213562_A
static const int16_t FIX_1_414213562_A
Definition: vf_fspp.h:49

NULL
#define NULL
Definition: coverity.c:32

column_fidct_c
static void column_fidct_c(int16_t *thr_adr, int16_t *data, int16_t *output, int cnt)
Definition: vf_fspp.c:247

av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2446

FSPPContext::threshold_mtx_noq
uint64_t threshold_mtx_noq[8 *2]
Definition: vf_fspp.h:57

AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:226

AV_PIX_FMT_NONE
Definition: pixfmt.h:65

h
h
Definition: vp9dsp_template.c:2038

AVOption
AVOption.
Definition: opt.h:246

data
ptrdiff_t const GLvoid * data
Definition: opengl_enc.c:101

FSPPContext::non_b_qp_table
uint8_t * non_b_qp_table
Definition: vf_fspp.h:70

AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:71

imgutils.h
misc image utilities

store_slice2_c
static void store_slice2_c(uint8_t *dst, int16_t *src, ptrdiff_t dst_stride, ptrdiff_t src_stride, ptrdiff_t width, ptrdiff_t height, ptrdiff_t log2_scale)
Definition: vf_fspp.c:113

temp
else temp
Definition: vf_mcdeint.c:256

desc
const char * desc
Definition: nvenc.c:65

AV_OPT_TYPE_INT
Definition: opt.h:223

AVFilterLink::h
int h
agreed upon image height
Definition: avfilter.h:450

AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:168

BLOCKSZ
#define BLOCKSZ
Definition: vf_fspp.h:28

FIX_1_414213562
#define FIX_1_414213562
Definition: 4xm.c:157

FIX_1_082392200
#define FIX_1_082392200
Definition: 4xm.c:156

ff_get_video_buffer
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
Definition: video.c:99

FSPPContext::threshold_mtx
uint64_t threshold_mtx[8 *2]
Definition: vf_fspp.h:58

src
#define src
Definition: vp8dsp.c:254

custom_threshold
static const short custom_threshold[64]
Definition: vf_fspp.c:68

AVFilterContext::is_disabled
int is_disabled
the enabled state from the last expression evaluation
Definition: avfilter.h:385

AVPixFmtDescriptor::log2_chroma_w
uint8_t log2_chroma_w
Amount to shift the luma width right to find the chroma width.
Definition: pixdesc.h:92

filter
static void filter(FSPPContext *p, uint8_t *dst, uint8_t *src, int dst_stride, int src_stride, int width, int height, uint8_t *qp_store, int qp_stride, int is_luma)
Definition: vf_fspp.c:149

THRESHOLD
#define THRESHOLD(r, x, t)
Definition: vf_fspp.h:39

av_calloc
void * av_calloc(size_t nmemb, size_t size)
Non-inlined equivalent of av_mallocz_array().
Definition: mem.c:244

ff_make_format_list
AVFilterFormats * ff_make_format_list(const int *fmts)
Create a list of supported formats.
Definition: formats.c:283

FSPPContext::row_fdct
void(* row_fdct)(int16_t *data, const uint8_t *pixels, ptrdiff_t line_size, int cnt)
Definition: vf_fspp.h:90

block
static int16_t block[64]
Definition: dct.c:115

DESCALE
#define DESCALE(x, n)
Definition: jfdctfst.c:135

AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:60

MULTIPLY16H
#define MULTIPLY16H(x, k)
Definition: vf_fspp.h:38

av_assert0
#define av_assert0(cond)
assert() equivalent, that is always enabled.
Definition: avassert.h:37

FSPPContext::mul_thrmat
void(* mul_thrmat)(int16_t *thr_adr_noq, int16_t *thr_adr, int q)
Definition: vf_fspp.h:82

FSPPContext::use_bframe_qp
int use_bframe_qp
Definition: vf_fspp.h:72

ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1080

uint8_t
uint8_t
Definition: audio_convert.c:194

av_cold
#define av_cold
Definition: attributes.h:82

opt.h
AVOptions.

FSPPContext
Definition: vf_fspp.h:55

row_fdct_c
static void row_fdct_c(int16_t *data, const uint8_t *pixels, ptrdiff_t line_size, int cnt)
Definition: vf_fspp.c:432

FSPPContext::non_b_qp_alloc_size
int non_b_qp_alloc_size
Definition: vf_fspp.h:71

DECLARE_ALIGNED
#define DECLARE_ALIGNED(n, t, v)
Declare a variable that is aligned in memory.
Definition: mem.h:112

height
#define height

AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range...
Definition: pixfmt.h:100

AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
Definition: pixfmt.h:79

FIX_0_382683433
#define FIX_0_382683433
Definition: jfdctfst.c:116

FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:48

MAX_LEVEL
#define MAX_LEVEL
Definition: rl.h:36

AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:54

AVFilterLink
A link between two filters.
Definition: avfilter.h:439

fspp_inputs
static const AVFilterPad fspp_inputs[]
Definition: vf_fspp.c:665

AVFrame::width
int width
Definition: frame.h:284

ff_set_common_formats
int ff_set_common_formats(AVFilterContext *ctx, AVFilterFormats *formats)
A helper for query_formats() which sets all links to the same list of formats.
Definition: formats.c:568

AVPixFmtDescriptor::log2_chroma_h
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
Definition: pixdesc.h:101

fspp_options
static const AVOption fspp_options[]
Definition: vf_fspp.c:47

ff_fspp_init_x86
void ff_fspp_init_x86(FSPPContext *fspp)
Definition: vf_fspp_init.c:37

AVERROR
#define AVERROR(e)
Definition: error.h:43

FSPPContext::src
uint8_t * src
Definition: vf_fspp.h:68

av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g. extended_data.
Definition: frame.c:202

NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:186

FSPPContext::row_idct
void(* row_idct)(int16_t *workspace, int16_t *output_adr, ptrdiff_t output_stride, int cnt)
Definition: vf_fspp.h:87

dither
static const uint8_t dither[8][8]
Definition: vf_fspp.c:57

AVFilterContext::priv
void * priv
private data for use by the filter
Definition: avfilter.h:353

FIX_1_847759065
#define FIX_1_847759065
Definition: 4xm.c:158

AVFILTER_DEFINE_CLASS
AVFILTER_DEFINE_CLASS(fspp)

avassert.h
simple assert() macros that are a bit more flexible than ISO C assert().

AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:70

DCTSIZE
#define DCTSIZE
Definition: jfdctfst.c:74

av_reallocp_array
int av_reallocp_array(void *ptr, size_t nmemb, size_t size)
Definition: mem.c:205

AVFilterLink::w
int w
agreed upon image width
Definition: avfilter.h:449

AVFrame::pict_type
enum AVPictureType pict_type
Picture type of the frame.
Definition: frame.h:309

pixdesc.h

ff_vf_fspp
AVFilter ff_vf_fspp
Definition: vf_fspp.c:683

FLAGS
#define FLAGS
Definition: vf_fspp.c:46

AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting color_range
Definition: pixfmt.h:78

width
#define width

w
uint8_t w
Definition: llviddspenc.c:38

FSPPContext::vsub
int vsub
Definition: vf_fspp.h:63

int32_t
int32_t
Definition: audio_convert.c:194

ctx
AVFormatContext * ctx
Definition: movenc.c:48

AV_OPT_TYPE_BOOL
Definition: opt.h:240

config_input
static int config_input(AVFilterLink *inlink)
Definition: vf_fspp.c:511

FIX_1_306562965
#define FIX_1_306562965
Definition: jfdctfst.c:119

inputs
static const AVFilterPad inputs[]
Definition: af_acontrast.c:193

outputs
static const AVFilterPad outputs[]
Definition: af_acontrast.c:203

AVFilterLink::format
int format
agreed upon media format
Definition: avfilter.h:456

STORE2
#define STORE2(pos)

STORE
#define STORE(pos)

FSPPContext::hsub
int hsub
Definition: vf_fspp.h:62

av_frame_is_writable
int av_frame_is_writable(AVFrame *frame)
Check if the frame data is writable.
Definition: frame.c:594

AVFrame::linesize
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Definition: frame.h:257

AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes of an image.
Definition: pixdesc.h:81

in
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(constint16_t *) pi >>8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(constint32_t *) pi >>24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(constfloat *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(constfloat *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(constfloat *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(constdouble *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(constdouble *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(constdouble *) pi *(1U<< 31))))#defineSET_CONV_FUNC_GROUP(ofmt, ifmt) staticvoidset_generic_function(AudioConvert *ac){}voidff_audio_convert_free(AudioConvert **ac){if(!*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);}AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enumAVSampleFormatout_fmt, enumAVSampleFormatin_fmt, intchannels, intsample_rate, 
intapply_map){AudioConvert *ac;intin_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) returnNULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method!=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt)>2){ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc){av_free(ac);returnNULL;}returnac;}in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar){ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar?ac->channels:1;}elseif(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;elseac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);returnac;}intff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in){intuse_generic=1;intlen=in->nb_samples;intp;if(ac->dc){av_log(ac->avr, AV_LOG_TRACE,"%dsamples-audio_convert:%sto%s(dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));returnff_convert_dither(ac-> in
Definition: audio_convert.c:194

AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
Definition: pixfmt.h:72

FSPPContext::store_slice2
void(* store_slice2)(uint8_t *dst, int16_t *src, ptrdiff_t dst_stride, ptrdiff_t src_stride, ptrdiff_t width, ptrdiff_t height, ptrdiff_t log2_scale)
Definition: vf_fspp.h:78

AVFilter
Filter definition.
Definition: avfilter.h:144

index
int index
Definition: gxfenc.c:89

uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: vf_fspp.c:657

store_slice_c
static void store_slice_c(uint8_t *dst, int16_t *src, ptrdiff_t dst_stride, ptrdiff_t src_stride, ptrdiff_t width, ptrdiff_t height, ptrdiff_t log2_scale)
Definition: vf_fspp.c:83

FIX_0_707106781
#define FIX_0_707106781
Definition: jfdctfst.c:118

OFFSET
#define OFFSET(x)
Definition: vf_fspp.c:45

FSPPContext::strength
int strength
Definition: vf_fspp.h:61

AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:148

query_formats
static int query_formats(AVFilterContext *ctx)
Definition: vf_fspp.c:493

AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() callback(s) called as usual even when the enable expression is false.
Definition: avfilter.h:133

AVFilterContext::outputs
AVFilterLink ** outputs
array of pointers to output links
Definition: avfilter.h:350

FSPPContext::qscale_type
int qscale_type
Definition: vf_fspp.h:66

ff_norm_qscale
static int ff_norm_qscale(int qscale, int type)
Normalize the qscale factor. FIXME: the H264 qscale is a log based scale, mpeg1/2 is not.
Definition: internal.h:397

pix_fmts
static enum AVPixelFormat pix_fmts[]
Definition: libkvazaar.c:266

row_idct_c
static void row_idct_c(int16_t *workspace, int16_t *output_adr, ptrdiff_t output_stride, int cnt)
Definition: vf_fspp.c:370

flags
#define flags(name, subs,...)
Definition: cbs_av1.c:596

AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:240

FSPPContext::store_slice
void(* store_slice)(uint8_t *dst, int16_t *src, ptrdiff_t dst_stride, ptrdiff_t src_stride, ptrdiff_t width, ptrdiff_t height, ptrdiff_t log2_scale)
Definition: vf_fspp.h:74

FIX_2_613125930
#define FIX_2_613125930
Definition: 4xm.c:159

stride
GLint GLenum GLboolean GLsizei stride
Definition: opengl_enc.c:105

AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:66

AV_PIX_FMT_GRAY8
Y, 8bpp.
Definition: pixfmt.h:74

mul_thrmat_c
static void mul_thrmat_c(int16_t *thr_adr_noq, int16_t *thr_adr, int q)
Definition: vf_fspp.c:142

AV_PICTURE_TYPE_B
Bi-dir predicted.
Definition: avutil.h:276

AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting color_range
Definition: pixfmt.h:80

AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
Definition: pixfmt.h:73

FSPPContext::column_fidct
void(* column_fidct)(int16_t *thr_adr, int16_t *data, int16_t *output, int cnt)
Definition: vf_fspp.h:84

FIX_0_541196100
#define FIX_0_541196100
Definition: jfdctfst.c:117

pixels
int pixels
Definition: avisynth_c.h:429

vf_fspp.h

AVFilterLink::dst
AVFilterContext * dst
dest filter
Definition: avfilter.h:443

filter_frame
static int filter_frame(AVFilterLink *inlink, AVFrame *in)
Definition: vf_fspp.c:548

int_simd16_t
int32_t int_simd16_t
Definition: vf_fspp.h:44

AVFilterFormats
A list of supported formats for one end of a filter link.
Definition: formats.h:64

AVFilterContext
An instance of a filter.
Definition: avfilter.h:338

AVFrame::height
int height
Definition: frame.h:284

FSPPContext::qp
int qp
Definition: vf_fspp.h:65

out
FILE * out
Definition: movenc.c:54

FSPPContext::log2_count
int log2_count
Definition: vf_fspp.h:60

av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35

AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
Definition: pixfmt.h:99

AVMEDIA_TYPE_VIDEO
Definition: avutil.h:201

fspp_outputs
static const AVFilterPad fspp_outputs[]
Definition: vf_fspp.c:675

av_malloc_array
#define av_malloc_array(a, b)
Definition: tableprint_vlc.h:32

FSPPContext::prev_q
int prev_q
Definition: vf_fspp.h:67

av_image_copy_plane
void av_image_copy_plane(uint8_t *dst, int dst_linesize, const uint8_t *src, int src_linesize, int bytewidth, int height)
Copy image plane from src to dst.
Definition: imgutils.c:338

FSPPContext::temp_stride
int temp_stride
Definition: vf_fspp.h:64

stride
#define stride

internal.h
internal API functions

av_frame_get_qp_table
int8_t * av_frame_get_qp_table(AVFrame *f, int *stride, int *type)
Definition: frame.c:90

FSPPContext::temp
int16_t * temp
Definition: vf_fspp.h:69

AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:64

for
for(j=16;j >0;--j)
Definition: h264pred_template.c:469

av_frame_copy_props
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
Definition: frame.c:654

ch
uint8_t pi<< 24) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_U8,(uint64_t)((*(constuint8_t *) pi-0x80U))<< 56) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8,(*(constuint8_t *) pi-0x80)*(1.0f/(1<< 7))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8,(*(constuint8_t *) pi-0x80)*(1.0/(1<< 7))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16,(*(constint16_t *) pi >>8)+0x80) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_S16,(uint64_t)(*(constint16_t *) pi)<< 48) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16,*(constint16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16,*(constint16_t *) pi *(1.0/(1<< 15))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32,(*(constint32_t *) pi >>24)+0x80) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_S32,(uint64_t)(*(constint32_t *) pi)<< 32) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32,*(constint32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32,*(constint32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S64,(*(constint64_t *) pi >>56)+0x80) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S64,*(constint64_t *) pi *(1.0f/(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S64,*(constint64_t *) pi *(1.0/(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, av_clip_uint8(lrintf(*(constfloat *) pi *(1<< 7))+0x80)) CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, av_clip_int16(lrintf(*(constfloat *) pi *(1<< 15)))) CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, av_clipl_int32(llrintf(*(constfloat *) pi *(1U<< 31)))) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_FLT, llrintf(*(constfloat *) pi *(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, av_clip_uint8(lrint(*(constdouble *) pi *(1<< 7))+0x80)) CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, av_clip_int16(lrint(*(constdouble *) pi 
*(1<< 15)))) CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, av_clipl_int32(llrint(*(constdouble *) pi *(1U<< 31)))) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_DBL, llrint(*(constdouble *) pi *(INT64_C(1)<< 63)))#defineFMT_PAIR_FUNC(out, in) staticconv_func_type *constfmt_pair_to_conv_functions[AV_SAMPLE_FMT_NB *AV_SAMPLE_FMT_NB]={FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S64), 
FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S64),};staticvoidcpy1(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, len);}staticvoidcpy2(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, 2 *len);}staticvoidcpy4(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, 4 *len);}staticvoidcpy8(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, 8 *len);}AudioConvert *swri_audio_convert_alloc(enumAVSampleFormatout_fmt, enumAVSampleFormatin_fmt, intchannels, constint *ch_map, intflags){AudioConvert *ctx;conv_func_type *f=fmt_pair_to_conv_functions[av_get_packed_sample_fmt(out_fmt)+AV_SAMPLE_FMT_NB *av_get_packed_sample_fmt(in_fmt)];if(!f) returnNULL;ctx=av_mallocz(sizeof(*ctx));if(!ctx) returnNULL;if(channels==1){in_fmt=av_get_planar_sample_fmt(in_fmt);out_fmt=av_get_planar_sample_fmt(out_fmt);}ctx->channels=channels;ctx->conv_f=f;ctx->ch_map=ch_map;if(in_fmt==AV_SAMPLE_FMT_U8||in_fmt==AV_SAMPLE_FMT_U8P) memset(ctx->silence, 0x80, sizeof(ctx->silence));if(out_fmt==in_fmt &&!ch_map){switch(av_get_bytes_per_sample(in_fmt)){case1:ctx->simd_f=cpy1;break;case2:ctx->simd_f=cpy2;break;case4:ctx->simd_f=cpy4;break;case8:ctx->simd_f=cpy8;break;}}if(HAVE_X86ASM &&1) swri_audio_convert_init_x86(ctx, out_fmt, in_fmt, channels);if(ARCH_ARM) swri_audio_convert_init_arm(ctx, out_fmt, in_fmt, channels);if(ARCH_AARCH64) swri_audio_convert_init_aarch64(ctx, out_fmt, in_fmt, channels);returnctx;}voidswri_audio_convert_free(AudioConvert **ctx){av_freep(ctx);}intswri_audio_convert(AudioConvert *ctx, AudioData *out, AudioData *in, 
intlen){intch;intoff=0;constintos=(out->planar?1:out->ch_count)*out->bps;unsignedmisaligned=0;av_assert0(ctx->channels==out->ch_count);if(ctx->in_simd_align_mask){intplanes=in->planar?in->ch_count:1;unsignedm=0;for(ch=0;ch< planes;ch++) m|=(intptr_t) in->ch[ch];misaligned|=m &ctx->in_simd_align_mask;}if(ctx->out_simd_align_mask){intplanes=out->planar?out->ch_count:1;unsignedm=0;for(ch=0;ch< planes;ch++) m|=(intptr_t) out->ch[ch];misaligned|=m &ctx->out_simd_align_mask;}if(ctx->simd_f &&!ctx->ch_map &&!misaligned){off=len &~15;av_assert1(off >=0);av_assert1(off<=len);av_assert2(ctx->channels==SWR_CH_MAX||!in->ch[ctx->channels]);if(off >0){if(out->planar==in->planar){intplanes=out->planar?out->ch_count:1;for(ch=0;ch< planes;ch++){ctx->simd_f(out-> ch ch
Definition: audioconvert.c:56

a
a
Definition: h264pred_template.c:468

AV_CEIL_RSHIFT
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:58