/* doxygen/3.2/vf__nnedi_8c_source.html */

 /*

  * Copyright (C) 2010-2011 Kevin Stone

  * Copyright (C) 2016 Paul B Mahol

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or modify

  * it under the terms of the GNU General Public License as published by

  * the Free Software Foundation; either version 2 of the License, or

  * (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the

  * GNU General Public License for more details.

  *

  * You should have received a copy of the GNU General Public License along

  * with FFmpeg; if not, write to the Free Software Foundation, Inc.,

  * 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA.

  */


 #include <float.h>


 #include "libavutil/common.h"

 #include "libavutil/float_dsp.h"

 #include "libavutil/imgutils.h"

 #include "libavutil/opt.h"

 #include "libavutil/pixdesc.h"

 #include "avfilter.h"

 #include "formats.h"

 #include "internal.h"

 #include "video.h"


 /**
  * Per-frame working buffers shared by copy_pad(), evalfunc_0() and
  * evalfunc_1(). All arrays are indexed by plane; get_frame() fills them in
  * for every processed plane before the processing stages run.
  */
 typedef struct FrameData {

     // Padded copy of the source plane; allocated once in get_frame()
     // (padded_stride * padded_height bytes) and filled by copy_pad().
     uint8_t *paddedp[3];

     // Row stride of paddedp in bytes: padded_width + 10, rounded up to a multiple of 16.
     int padded_stride[3];

     // Plane byte width + 64 (the copied data starts at column 32).
     int padded_width[3];

     // Plane height + 12 (the copied data starts at row 6).
     int padded_height[3];


     // Destination plane pointers, taken from the output frame's data[].
     uint8_t *dstp[3];

     // Destination strides, taken from the output frame's linesize[].
     int dst_stride[3];


     // Field selector (field_n computed in get_frame()); rows with this parity are the ones generated.
     int field[3];


     // Per-plane counters, zeroed for every frame; evalfunc_0() adds one value per generated row.
     int32_t *lcount[3];

     // Scratch buffer of 512 floats handed to readpixels()/extract().
     float *input;

     // Scratch buffer: evalfunc_0() uses it as one byte per pixel, evalfunc_1() as floats.
     float *temp;

 } FrameData;


 /**
  * Private context of the nnedi filter: user options, cached link geometry,
  * network weights, the function pointers chosen by select_functions() and
  * the reusable per-frame buffers.
  */
 typedef struct NNEDIContext {

     const AVClass *class;


     // Path of the weights file ("weights" option), opened in init().
     char *weights_file;


     // Frame get_frame() reads from.
     AVFrame *src;

     // In both-fields modes: input frame kept by filter_frame() so that its
     // second field can be emitted when the next frame (or EOF) arrives.
     AVFrame *second;

     // Output frame allocated by get_frame().
     AVFrame *dst;

     // Set by request_frame() once the input returned EOF and the flush was started.
     int eof;

     // pts of the previously held "second" frame; request_frame() uses it to
     // extrapolate the pts of the flush frame.
     int64_t cur_pts;


     // Float DSP helpers; dot_prod() uses scalarproduct_float().
     AVFloatDSPContext *fdsp;

     // Number of planes of the input format (config_input()).
     int nb_planes;

     // Byte width of each plane (config_input()).
     int linesize[4];

     // Height of each plane in rows (config_input()).
     int planeheight[4];


     // Prescreener weights, passed to compute_network0() by evalfunc_0().
     float *weights0;

     // Predictor weights; evalfunc_1() uses weights1[i] for pass i < qual.
     float *weights1[2];

     // Length of one predictor input vector as passed to dot_prod() in evalfunc_1().
     int asize;

     // Neuron count used by evalfunc_1() (dot_prod() is called with nns * 2 outputs).
     int nns;

     // Width of the neighbourhood handed to extract().
     int xdia;

     // Height (in same-field rows) of the neighbourhood handed to extract().
     int ydia;


     // Parameters

     int deint;

     int field;

     int process_plane;

     int nsize;

     int nnsparam;

     int qual;

     int etype;

     int pscrn;

     int fapprox;


     // Upper clamp for generated pixels (evalfunc_1()); process_line0() clamps to max_value - 1.
     int max_value;


     // Processing stages, assigned in select_functions().
     void (*copy_pad)(const AVFrame *, FrameData *, struct NNEDIContext *, int);

     void (*evalfunc_0)(struct NNEDIContext *, FrameData *);

     void (*evalfunc_1)(struct NNEDIContext *, FrameData *);


     // Functions used in evalfunc_0

     void (*readpixels)(const uint8_t *, const int, float *);

     void (*compute_network0)(struct NNEDIContext *s, const float *, const float *, uint8_t *);

     int32_t (*process_line0)(const uint8_t *, int, uint8_t *, const uint8_t *, const int, const int, const int);


     // Functions used in evalfunc_1

     void (*extract)(const uint8_t *, const int, const int, const int, float *, float *);

     void (*dot_prod)(struct NNEDIContext *, const float *, const float *, float *, const int, const int, const float *);

     void (*expfunc)(float *, const int);

     void (*wae5)(const float *, const int, float *);


     // Buffers reused across frames; see FrameData.
     FrameData frame_data;

 } NNEDIContext;


 // Byte offset of an option's backing field inside NNEDIContext.
 #define OFFSET(x) offsetof(NNEDIContext, x)

 // Flags shared by every option of this filter. The expansion is
 // parenthesized so the mask stays a single operand wherever it is used.
 #define FLAGS (AV_OPT_FLAG_VIDEO_PARAM|AV_OPT_FLAG_FILTERING_PARAM)


 /*
  * User-visible options. Each AV_OPT_TYPE_INT entry is followed by the named
  * constants (AV_OPT_TYPE_CONST) that share its unit string.
  */
 static const AVOption nnedi_options[] = {

     {"weights",  "set weights file", OFFSET(weights_file),  AV_OPT_TYPE_STRING, {.str="nnedi3_weights.bin"}, 0, 0, FLAGS },

     {"deint",         "set which frames to deinterlace", OFFSET(deint),         AV_OPT_TYPE_INT, {.i64=0}, 0, 1, FLAGS, "deint" },

         {"all",        "deinterlace all frames",                       0, AV_OPT_TYPE_CONST, {.i64=0}, 0, 0, FLAGS, "deint" },

         {"interlaced", "only deinterlace frames marked as interlaced", 0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, FLAGS, "deint" },

     // Values -2, 2 and 3 are the both-fields modes (tested as "field > 1 || field == -2" in the code).
     {"field",  "set mode of operation", OFFSET(field),         AV_OPT_TYPE_INT, {.i64=-1}, -2, 3, FLAGS, "field" },

         {"af", "use frame flags, both fields",  0, AV_OPT_TYPE_CONST, {.i64=-2}, 0, 0, FLAGS, "field" },

         {"a",  "use frame flags, single field", 0, AV_OPT_TYPE_CONST, {.i64=-1}, 0, 0, FLAGS, "field" },

         {"t",  "use top field only",            0, AV_OPT_TYPE_CONST, {.i64=0},  0, 0, FLAGS, "field" },

         {"b",  "use bottom field only",         0, AV_OPT_TYPE_CONST, {.i64=1},  0, 0, FLAGS, "field" },

         {"tf", "use both fields, top first",    0, AV_OPT_TYPE_CONST, {.i64=2}, 0, 0, FLAGS, "field" },

         {"bf", "use both fields, bottom first", 0, AV_OPT_TYPE_CONST, {.i64=3}, 0, 0, FLAGS, "field" },

     // Bit mask: bit N set means plane N is processed (tested as process_plane & (1 << plane)).
     {"planes", "set which planes to process", OFFSET(process_plane), AV_OPT_TYPE_INT, {.i64=7}, 0, 7, FLAGS },

     {"nsize",  "set size of local neighborhood around each pixel, used by the predictor neural network", OFFSET(nsize), AV_OPT_TYPE_INT, {.i64=6}, 0, 6, FLAGS, "nsize" },

         {"s8x6",     NULL, 0, AV_OPT_TYPE_CONST, {.i64=0}, 0, 0, FLAGS, "nsize" },

         {"s16x6",    NULL, 0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, FLAGS, "nsize" },

         {"s32x6",    NULL, 0, AV_OPT_TYPE_CONST, {.i64=2}, 0, 0, FLAGS, "nsize" },

         {"s48x6",    NULL, 0, AV_OPT_TYPE_CONST, {.i64=3}, 0, 0, FLAGS, "nsize" },

         {"s8x4",     NULL, 0, AV_OPT_TYPE_CONST, {.i64=4}, 0, 0, FLAGS, "nsize" },

         {"s16x4",    NULL, 0, AV_OPT_TYPE_CONST, {.i64=5}, 0, 0, FLAGS, "nsize" },

         {"s32x4",    NULL, 0, AV_OPT_TYPE_CONST, {.i64=6}, 0, 0, FLAGS, "nsize" },

     {"nns",    "set number of neurons in predictor neural network", OFFSET(nnsparam), AV_OPT_TYPE_INT, {.i64=1}, 0, 4, FLAGS, "nns" },

         {"n16",       NULL, 0, AV_OPT_TYPE_CONST, {.i64=0}, 0, 0, FLAGS, "nns" },

         {"n32",       NULL, 0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, FLAGS, "nns" },

         {"n64",       NULL, 0, AV_OPT_TYPE_CONST, {.i64=2}, 0, 0, FLAGS, "nns" },

         {"n128",      NULL, 0, AV_OPT_TYPE_CONST, {.i64=3}, 0, 0, FLAGS, "nns" },

         {"n256",      NULL, 0, AV_OPT_TYPE_CONST, {.i64=4}, 0, 0, FLAGS, "nns" },

     // Number of predictor passes; evalfunc_1() runs "qual" networks and averages them.
     {"qual",  "set quality", OFFSET(qual), AV_OPT_TYPE_INT, {.i64=1}, 1, 2, FLAGS, "qual" },

         {"fast", NULL, 0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, FLAGS, "qual" },

         {"slow", NULL, 0, AV_OPT_TYPE_CONST, {.i64=2}, 0, 0, FLAGS, "qual" },

     {"etype", "set which set of weights to use in the predictor", OFFSET(etype), AV_OPT_TYPE_INT, {.i64=0}, 0, 1, FLAGS, "etype" },

         {"a",  "weights trained to minimize absolute error", 0, AV_OPT_TYPE_CONST, {.i64=0}, 0, 0, FLAGS, "etype" },

         {"s",  "weights trained to minimize squared error",  0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, FLAGS, "etype" },

     {"pscrn", "set prescreening", OFFSET(pscrn), AV_OPT_TYPE_INT, {.i64=2}, 0, 2, FLAGS, "pscrn" },

         {"none",      NULL, 0, AV_OPT_TYPE_CONST, {.i64=0}, 0, 0, FLAGS, "pscrn" },

         {"original",  NULL, 0, AV_OPT_TYPE_CONST, {.i64=1}, 0, 0, FLAGS, "pscrn" },

         {"new",       NULL, 0, AV_OPT_TYPE_CONST, {.i64=2}, 0, 0, FLAGS, "pscrn" },

     // Bit mask read by select_functions(): bit 0 selects int16 dot products for
     // the original prescreener, bit 1 selects int16 dot products for the predictor.
     {"fapprox",       NULL, OFFSET(fapprox),       AV_OPT_TYPE_INT, {.i64=0}, 0, 3, FLAGS },

     { NULL }

 };


 AVFILTER_DEFINE_CLASS(nnedi);


 /**
  * Input link configuration: cache the plane count, the byte width of every
  * plane and the height of every plane for the negotiated pixel format.
  *
  * @return 0 on success, a negative error code if the line sizes cannot be
  *         computed.
  */
 static int config_input(AVFilterLink *inlink)
 {
     NNEDIContext *s = inlink->dst->priv;
     const AVPixFmtDescriptor *desc = av_pix_fmt_desc_get(inlink->format);
     int ret;

     s->nb_planes = av_pix_fmt_count_planes(inlink->format);

     ret = av_image_fill_linesizes(s->linesize, inlink->format, inlink->w);
     if (ret < 0)
         return ret;

     // Planes 0 and 3 are full height, planes 1 and 2 are vertically subsampled.
     s->planeheight[0] = inlink->h;
     s->planeheight[3] = inlink->h;
     s->planeheight[2] = AV_CEIL_RSHIFT(inlink->h, desc->log2_chroma_h);
     s->planeheight[1] = s->planeheight[2];

     return 0;
 }


 /**
  * Output link configuration: same dimensions as the input, a time base with
  * twice the input denominator, and a doubled frame rate when both fields of
  * each frame are output.
  */
 static int config_output(AVFilterLink *outlink)
 {
     AVFilterContext *ctx = outlink->src;
     const AVFilterLink *inlink = ctx->inputs[0];
     const NNEDIContext *s = ctx->priv;
     const int both_fields = s->field == -2 || s->field > 1;

     outlink->w = inlink->w;
     outlink->h = inlink->h;

     // Timestamps are emitted in half-frame units (see the "pts * 2" in filter_frame()).
     outlink->time_base = (AVRational){ inlink->time_base.num,
                                        inlink->time_base.den * 2 };

     if (both_fields)
         outlink->frame_rate = av_mul_q(inlink->frame_rate, (AVRational){2, 1});

     return 0;
 }


 /**
  * Advertise the supported pixel formats: 8-bit planar YUV/YUVJ, planar GBR
  * and 8-bit gray.
  *
  * @return 0 or a negative error code (AVERROR(ENOMEM) if the list cannot be
  *         allocated).
  */
 static int query_formats(AVFilterContext *ctx)
 {
     static const enum AVPixelFormat supported[] = {
         AV_PIX_FMT_YUV410P,  AV_PIX_FMT_YUV411P,
         AV_PIX_FMT_YUV420P,  AV_PIX_FMT_YUV422P,
         AV_PIX_FMT_YUV440P,  AV_PIX_FMT_YUV444P,
         AV_PIX_FMT_YUVJ444P, AV_PIX_FMT_YUVJ440P,
         AV_PIX_FMT_YUVJ422P, AV_PIX_FMT_YUVJ420P,
         AV_PIX_FMT_YUVJ411P,
         AV_PIX_FMT_GBRP,
         AV_PIX_FMT_GRAY8,
         AV_PIX_FMT_NONE
     };
     AVFilterFormats *formats = ff_make_format_list(supported);

     return formats ? ff_set_common_formats(ctx, formats) : AVERROR(ENOMEM);
 }


 /**
  * Copy every second row of src (starting at row 1 - fn) into the padded work
  * planes and fill the borders by mirroring.
  *
  * The copied data lives at column 32 / row 6 of the padded plane. The 32
  * columns on each side and the 6 rows above and below are filled from the
  * already copied data, touching only rows with the same parity as the copied
  * rows.
  *
  * @param src        source frame
  * @param frame_data padded buffers and their geometry
  * @param s          filter context (plane count, plane sizes, plane mask)
  * @param fn         field selector; rows with parity 1 - fn are copied
  */
 static void copy_pad(const AVFrame *src, FrameData *frame_data, NNEDIContext *s, int fn)
 {
     const int first_row = 1 - fn;
     int plane;

     for (plane = 0; plane < s->nb_planes; plane++) {
         const uint8_t *in;
         uint8_t *padded, *row;
         int in_stride, in_height, row_bytes;
         int pad_stride, pad_height, pad_width;
         int y, x, mirror;

         if (!(s->process_plane & (1 << plane)))
             continue;

         in         = (const uint8_t *)src->data[plane];
         in_stride  = src->linesize[plane];
         in_height  = s->planeheight[plane];
         row_bytes  = s->linesize[plane];

         padded     = (uint8_t *)frame_data->paddedp[plane];
         pad_stride = frame_data->padded_stride[plane];
         pad_height = frame_data->padded_height[plane];
         pad_width  = frame_data->padded_width[plane];

         // Interior: the selected field's rows, shifted by 6 rows and 32 columns.
         for (y = first_row; y < in_height; y += 2)
             memcpy(padded + (6 + y) * pad_stride + 32,
                    in + y * in_stride,
                    row_bytes * sizeof(uint8_t));

         // Left and right borders of every copied row.
         row = padded + (6 + first_row) * pad_stride;
         for (y = 6 + first_row; y < pad_height - 6; y += 2, row += pad_stride * 2) {
             for (x = 0; x < 32; x++)
                 row[x] = row[64 - x];

             // The source column walks leftwards while the target walks rightwards.
             mirror = pad_width - 34;
             for (x = pad_width - 32; x < pad_width; x++, mirror--)
                 row[x] = row[mirror];
         }

         // Top border rows.
         for (y = first_row; y < 6; y += 2)
             memcpy(padded + y * pad_stride,
                    padded + (12 + 2 * first_row - y) * pad_stride,
                    pad_width * sizeof(uint8_t));

         // Bottom border rows: the source row moves up by 2 for each target row.
         mirror = pad_height - 6 + first_row - 4;
         for (y = pad_height - 6 + first_row; y < pad_height; y += 2, mirror -= 2)
             memcpy(padded + y * pad_stride,
                    padded + mirror * pad_stride,
                    pad_width * sizeof(uint8_t));
     }
 }


 /**
  * Apply the Elliott activation x / (1 + |x|) in place to the first n
  * elements of data.
  */
 static void elliott(float *data, const int n)
 {
     int left;

     for (left = n; left > 0; left--, data++) {
         const float v = *data;

         *data = v / (1.0f + FFABS(v));
     }
 }


 /**
  * Float layer evaluation: vals[i] = <data, weights row i> * scale[0] + bias[i].
  *
  * The weights buffer holds n rows of len floats followed by n bias values.
  */
 static void dot_prod(NNEDIContext *s, const float *data, const float *weights, float *vals, const int n, const int len, const float *scale)
 {
     const float *bias = weights + n * len;
     const float *row = weights;
     int neuron;

     for (neuron = 0; neuron < n; neuron++, row += len) {
         const float acc = s->fdsp->scalarproduct_float(data, row, len);

         vals[neuron] = acc * scale[0] + bias[neuron];
     }
 }


 /**
  * Integer layer evaluation. dataf and weightsf actually hold int16_t values:
  * n rows of len int16 weights, followed by a float table that stores, for
  * each group of four neurons, four per-neuron multipliers and then four
  * per-neuron offsets.
  *
  * vals[i] = (int dot product) * multiplier[i] * scale[0] + offset[i]
  */
 static void dot_prods(NNEDIContext *s, const float *dataf, const float *weightsf, float *vals, const int n, const int len, const float *scale)
 {
     const int16_t *data = (const int16_t *)dataf;
     const int16_t *weights = (const int16_t *)weightsf;
     const float *wf = (const float *)&weights[n * len];
     int neuron;

     for (neuron = 0; neuron < n; neuron++) {
         const int16_t *row = weights + neuron * len;
         // Groups of 4 neurons occupy 8 floats: 4 multipliers, then 4 offsets.
         const int slot = ((neuron >> 2) << 3) + (neuron & 3);
         int acc = 0;
         int k;

         for (k = 0; k < len; k++)
             acc += data[k] * row[k];

         vals[neuron] = acc * wf[slot] * scale[0] + wf[slot + 4];
     }
 }


 /**
  * Original prescreener, float version. Runs a 48 -> 4 -> 4 -> 4 network on
  * input and writes a single flag to d[0]: 1 when
  * max(out[2], out[3]) <= max(out[0], out[1]), otherwise 0.
  *
  * Weight layout (floats): 4 x 48 weights + 4 biases, then 4 x 4 weights +
  * 4 biases, then 4 x 8 weights + 4 biases.
  */
 static void compute_network0(NNEDIContext *s, const float *input, const float *weights, uint8_t *d)
 {
     const float *layer1 = weights + 4 * 49;
     const float *layer2 = layer1 + 4 * 5;
     float temp[12], scale = 1.0f;
     float first_raw;

     dot_prod(s, input, weights, temp, 4, 48, &scale);

     // The first neuron bypasses the activation.
     first_raw = temp[0];
     elliott(temp, 4);
     temp[0] = first_raw;

     dot_prod(s, temp, layer1, temp + 4, 4, 4, &scale);
     elliott(temp + 4, 4);

     // The last layer sees the outputs of both previous layers (8 inputs).
     dot_prod(s, temp, layer2, temp + 8, 4, 8, &scale);

     d[0] = FFMAX(temp[10], temp[11]) <= FFMAX(temp[8], temp[9]);
 }


 /**
  * Original prescreener with an int16 first layer. The first layer is
  * evaluated by dot_prods() on int16 data; the two following layers are float
  * and identical in shape to compute_network0(). Writes one flag to d[0].
  */
 static void compute_network0_i16(NNEDIContext *s, const float *inputf, const float *weightsf, uint8_t *d)
 {
     // 4 x 48 int16 weights occupy 2 * 48 floats; 8 more floats hold the
     // first layer's multipliers and offsets.
     const float *layer1 = weightsf + 2 * 48 + 8;
     const float *layer2 = layer1 + 4 * 5;
     float temp[12], scale = 1.0f;
     float first_raw;

     dot_prods(s, inputf, weightsf, temp, 4, 48, &scale);

     // The first neuron bypasses the activation.
     first_raw = temp[0];
     elliott(temp, 4);
     temp[0] = first_raw;

     dot_prod(s, temp, layer1, temp + 4, 4, 4, &scale);
     elliott(temp + 4, 4);
     dot_prod(s, temp, layer2, temp + 8, 4, 8, &scale);

     d[0] = FFMAX(temp[10], temp[11]) <= FFMAX(temp[8], temp[9]);
 }


 /**
  * Gather a 12 x 4 window as floats. Rows are taken every second line
  * (2 * pitch bytes apart) and stored consecutively in p (48 values).
  */
 static void pixel2float48(const uint8_t *t8, const int pitch, float *p)
 {
     int row, col;

     for (row = 0; row < 4; row++) {
         const uint8_t *line = t8 + row * pitch * 2;

         for (col = 0; col < 12; col++)
             *p++ = line[col];
     }
 }


 /**
  * Gather a 12 x 4 window as int16_t values. Rows are taken every second line
  * (2 * pitch bytes apart). pf is only used as storage for 48 int16_t values.
  */
 static void byte2word48(const uint8_t *t, const int pitch, float *pf)
 {
     int16_t *out = (int16_t *)pf;
     int row, col;

     for (row = 0; row < 4; row++) {
         const uint8_t *line = t + row * pitch * 2;

         for (col = 0; col < 12; col++)
             *out++ = line[col];
     }
 }


 /**
  * Fill one output row from the prescreener flags.
  *
  * Where tempu[x] is non-zero the pixel is interpolated vertically with the
  * 4-tap kernel (-3, 19, 19, -3) / 32 over rows 0, 2, 4 and 6 of src3p8 and
  * clamped to [0, max_value - 1]. Everywhere else the pixel is set to 255,
  * the marker evalfunc_1() looks for.
  *
  * @param chroma unused
  * @return number of pixels marked with 255
  */
 static int32_t process_line0(const uint8_t *tempu, int width, uint8_t *dstp8, const uint8_t *src3p8, const int src_pitch, const int max_value, const int chroma)
 {
     // The -1 keeps interpolated pixels from colliding with the 255 marker.
     const int upper = max_value - 1;
     int marked = 0;
     int x;

     for (x = 0; x < width; x++) {
         int inner, outer, value;

         if (!tempu[x]) {
             dstp8[x] = 255;
             marked++;
             continue;
         }

         inner = src3p8[x + src_pitch * 2] + src3p8[x + src_pitch * 4];
         outer = src3p8[x] + src3p8[x + src_pitch * 6];
         value = (19 * inner - 3 * outer) / 32;

         dstp8[x] = FFMAX(FFMIN(value, upper), 0);
     }

     return marked;
 }


 // new prescreener functions

 /**
  * Gather a 16 x 4 window as int16_t values. Rows are taken every second line
  * (2 * pitch bytes apart). p is only used as storage for 64 int16_t values.
  */
 static void byte2word64(const uint8_t *t, const int pitch, float *p)
 {
     int16_t *out = (int16_t *)p;
     int row, col;

     for (row = 0; row < 4; row++) {
         const uint8_t *line = t + row * pitch * 2;

         for (col = 0; col < 16; col++)
             *out++ = line[col];
     }
 }


 /**
  * New prescreener. Evaluates a 64 -> 4 -> 4 network on int16 input and
  * writes four flags, d[0] .. d[3]: d[i] is 1 when output i of the second
  * layer is positive, otherwise 0.
  *
  * datai holds 64 int16_t samples (see byte2word64()). weights holds 4 x 64
  * int16_t first-layer weights followed by floats: 4 multipliers, 4 offsets,
  * 4 x 4 second-layer weights and 4 second-layer biases.
  *
  * The flags are stored byte by byte. The previous code packed them into an
  * int and stored it through an int pointer, which reversed the flag order on
  * big-endian hosts and relied on d being int-aligned.
  */
 static void compute_network0new(NNEDIContext *s, const float *datai, const float *weights, uint8_t *d)
 {
     const int16_t *data = (const int16_t *)datai;
     const int16_t *ws = (const int16_t *)weights;
     const float *wf = (const float *)&ws[4 * 64];
     float vals[8];
     int i, j;

     // First layer: int16 dot product, then scale/offset and Elliott activation.
     for (i = 0; i < 4; i++) {
         int sum = 0;
         float t;

         // Weights are interleaved in blocks of 8 per neuron.
         for (j = 0; j < 64; j++)
             sum += data[j] * ws[(i << 3) + ((j >> 3) << 5) + (j & 7)];
         t = sum * wf[i] + wf[4 + i];
         vals[i] = t / (1.0f + FFABS(t));
     }

     // Second layer: plain float 4 x 4 product plus bias.
     for (i = 0; i < 4; i++) {
         float sum = 0.0f;

         for (j = 0; j < 4; j++)
             sum += vals[j] * wf[8 + i + (j << 2)];
         vals[4 + i] = sum + wf[8 + 16 + i];
     }

     // One flag byte per pixel.
     for (i = 0; i < 4; i++)
         d[i] = vals[4 + i] > 0.0f;
 }


 /**
  * First processing stage, run for every plane selected by process_plane.
  *
  * 1. Copies the rows that already exist (parity 1 - field) from the padded
  *    source into the destination.
  * 2. For every missing row, depending on s->pscrn:
  *    - 0: fills the row with 255 so evalfunc_1() predicts every pixel;
  *    - 1: runs the original prescreener once per pixel;
  *    - 2: runs the new prescreener once per group of 4 pixels;
  *    and, for 1 and 2, hands the resulting flags in temp to
  *    s->process_line0(), which writes the row and returns a count that is
  *    accumulated in lcount.
  *
  * x and y below are coordinates in the padded plane (data starts at column
  * 32 / row 6); dstp and lcount are pre-biased so they can be indexed with
  * the same coordinates.
  */
 static void evalfunc_0(NNEDIContext *s, FrameData *frame_data)

 {

     float *input = frame_data->input;

     const float *weights0 = s->weights0;

     float *temp = frame_data->temp;

     // The prescreener flags are stored as bytes in the temp buffer.
     uint8_t *tempu = (uint8_t *)temp;

     int plane, x, y;


     // And now the actual work.

     for (plane = 0; plane < s->nb_planes; plane++) {

         const uint8_t *srcp = (const uint8_t *)frame_data->paddedp[plane];

         const int src_stride = frame_data->padded_stride[plane] / sizeof(uint8_t);


         const int width = frame_data->padded_width[plane];

         const int height = frame_data->padded_height[plane];


         uint8_t *dstp = (uint8_t *)frame_data->dstp[plane];

         const int dst_stride = frame_data->dst_stride[plane] / sizeof(uint8_t);

         const uint8_t *src3p;

         int ystart, ystop;

         int32_t *lcount;


         if (!(s->process_plane & (1 << plane)))

             continue;


         // Copy the existing field rows, dropping the padding (32 columns, 6 rows).
         for (y = 1 - frame_data->field[plane]; y < height - 12; y += 2) {

             memcpy(dstp + y * dst_stride,

                    srcp + 32 + (6 + y) * src_stride,

                    (width - 64) * sizeof(uint8_t));


         }


         ystart = 6 + frame_data->field[plane];

         ystop = height - 6;

         srcp += ystart * src_stride;

         // Bias dstp by -32 columns so that padded x coordinates can be used directly.
         dstp += (ystart - 6) * dst_stride - 32;

         // Three rows above the row being generated.
         src3p = srcp - src_stride * 3;

         // Bias lcount so that it can be indexed with the padded row number.
         lcount = frame_data->lcount[plane] - 6;


         if (s->pscrn == 1) { // original

             for (y = ystart; y < ystop; y += 2) {

                 for (x = 32; x < width - 32; x++) {

                     s->readpixels((const uint8_t *)(src3p + x - 5), src_stride, input);

                     s->compute_network0(s, input, weights0, tempu+x);

                 }

                 lcount[y] += s->process_line0(tempu + 32, width - 64, (uint8_t *)(dstp + 32), (const uint8_t *)(src3p + 32), src_stride, s->max_value, plane);

                 src3p += src_stride * 2;

                 dstp += dst_stride * 2;

             }

         } else if (s->pscrn > 1) { // new

             for (y = ystart; y < ystop; y += 2) {

                 // One network evaluation per 4 pixels.
                 for (x = 32; x < width - 32; x += 4) {

                     s->readpixels((const uint8_t *)(src3p + x - 6), src_stride, input);

                     s->compute_network0(s, input, weights0, tempu + x);

                 }

                 lcount[y] += s->process_line0(tempu + 32, width - 64, (uint8_t *)(dstp + 32), (const uint8_t *)(src3p + 32), src_stride, s->max_value, plane);

                 src3p += src_stride * 2;

                 dstp += dst_stride * 2;

             }

         } else { // no prescreening

             for (y = ystart; y < ystop; y += 2) {

                 // 255 marks a pixel that evalfunc_1() has to predict.
                 memset(dstp + 32, 255, (width - 64) * sizeof(uint8_t));

                 lcount[y] += width - 64;

                 dstp += dst_stride * 2;

             }

         }

     }

 }


 static void extract_m8(const uint8_t *srcp8, const int stride, const int xdia, const int ydia, float *mstd, float *input)

 {

     // uint8_t or uint16_t or float

     const uint8_t *srcp = (const uint8_t *)srcp8;

     float scale;

     double tmp;


     // int32_t or int64_t or double

     int64_t sum = 0, sumsq = 0;

     int y, x;


     for (y = 0; y < ydia; y++) {

         const uint8_t *srcpT = srcp + y * stride * 2;


         for (x = 0; x < xdia; x++) {

             sum += srcpT[x];

             sumsq += (uint32_t)srcpT[x] * (uint32_t)srcpT[x];

             input[x] = srcpT[x];

         }

         input += xdia;

     }

     scale = 1.0f / (xdia * ydia);

     mstd[0] = sum * scale;

     tmp = (double)sumsq * scale - (double)mstd[0] * mstd[0];

     mstd[3] = 0.0f;

     if (tmp <= FLT_EPSILON)

         mstd[1] = mstd[2] = 0.0f;

     else {

         mstd[1] = sqrt(tmp);

         mstd[2] = 1.0f / mstd[1];

     }

 }


 static void extract_m8_i16(const uint8_t *srcp, const int stride, const int xdia, const int ydia, float *mstd, float *inputf)

 {

     int16_t *input = (int16_t *)inputf;

     float scale;

     int sum = 0, sumsq = 0;

     int y, x;


     for (y = 0; y < ydia; y++) {

         const uint8_t *srcpT = srcp + y * stride * 2;

         for (x = 0; x < xdia; x++) {

             sum += srcpT[x];

             sumsq += srcpT[x] * srcpT[x];

             input[x] = srcpT[x];

         }

         input += xdia;

     }

     scale = 1.0f / (float)(xdia * ydia);

     mstd[0] = sum * scale;

     mstd[1] = sumsq * scale - mstd[0] * mstd[0];

     mstd[3] = 0.0f;

     if (mstd[1] <= FLT_EPSILON)

         mstd[1] = mstd[2] = 0.0f;

     else {

         mstd[1] = sqrt(mstd[1]);

         mstd[2] = 1.0f / mstd[1];

     }

 }


 // Range the exponent is clipped to before exp() is applied.
 static const float exp_lo = -80.0f;
 static const float exp_hi = +80.0f;

 /**
  * Replace each of the first n elements of s by exp() of its value clipped to
  * [exp_lo, exp_hi].
  */
 static void e2_m16(float *s, const int n)
 {
     int left;

     for (left = n; left > 0; left--, s++)
         *s = exp(av_clipf(*s, exp_lo, exp_hi));
 }


 // Smallest weight sum considered usable as a divisor. File-local: it was
 // previously defined without "static", which exported an unprefixed global symbol.
 static const float min_weight_sum = 1e-10f;

 /**
  * Combine the outputs of one predictor pass into mstd[3].
  *
  * w holds n weights followed by n values. The values are passed through the
  * Elliott function, averaged with the weights, multiplied by 5 and by the
  * deviation mstd[1], and offset by the mean mstd[0]. The result is added to
  * mstd[3]. When the weight sum is not above min_weight_sum only the mean is
  * added.
  */
 static void weighted_avg_elliott_mul5_m16(const float *w, const int n, float *mstd)
 {
     float vsum = 0.0f, wsum = 0.0f;
     int i;

     for (i = 0; i < n; i++) {
         vsum += w[i] * (w[n + i] / (1.0f + FFABS(w[n + i])));
         wsum += w[i];
     }

     if (wsum > min_weight_sum)
         mstd[3] += ((5.0f * vsum) / wsum) * mstd[1] + mstd[0];
     else
         mstd[3] += mstd[0];
 }


 /**
  * Second processing stage, run for every plane selected by process_plane.
  *
  * Visits every generated row of the destination and, for each pixel that
  * still holds the marker value 255, extracts the xdia x ydia neighbourhood
  * from the padded source, runs "qual" predictor passes (dot_prod, expfunc,
  * wae5) that accumulate into mstd[3], and stores the rounded average clamped
  * to [0, s->max_value].
  *
  * x is a column of the padded plane (data starts at column 32); dstp is
  * pre-biased by -32 so it can be indexed with the same x.
  */
 static void evalfunc_1(NNEDIContext *s, FrameData *frame_data)

 {

     float *input = frame_data->input;

     float *temp = frame_data->temp;

     float **weights1 = s->weights1;

     const int qual = s->qual;

     const int asize = s->asize;

     const int nns = s->nns;

     const int xdia = s->xdia;

     // Horizontal offset from the pixel to the left edge of its window.
     const int xdiad2m1 = (xdia / 2) - 1;

     const int ydia = s->ydia;

     // Averages the results of the "qual" passes.
     const float scale = 1.0f / (float)qual;

     int plane, y, x, i;


     for (plane = 0; plane < s->nb_planes; plane++) {

         const uint8_t *srcp = (const uint8_t *)frame_data->paddedp[plane];

         const int src_stride = frame_data->padded_stride[plane] / sizeof(uint8_t);


         const int width = frame_data->padded_width[plane];

         const int height = frame_data->padded_height[plane];


         uint8_t *dstp = (uint8_t *)frame_data->dstp[plane];

         const int dst_stride = frame_data->dst_stride[plane] / sizeof(uint8_t);


         const int ystart = frame_data->field[plane];

         const int ystop = height - 12;

         const uint8_t *srcpp;


         if (!(s->process_plane & (1 << plane)))

             continue;


         srcp += (ystart + 6) * src_stride;

         dstp += ystart * dst_stride - 32;

         // Top-left corner of the window for x = 0 on the first generated row.
         srcpp = srcp - (ydia - 1) * src_stride - xdiad2m1;


         for (y = ystart; y < ystop; y += 2) {

             for (x = 32; x < width - 32; x++) {

                 float mstd[4];


                 // Only pixels left marked with 255 by evalfunc_0() are predicted.
                 if (dstp[x] != 255)

                     continue;


                 s->extract((const uint8_t *)(srcpp + x), src_stride, xdia, ydia, mstd, input);

                 for (i = 0; i < qual; i++) {

                     s->dot_prod(s, input, weights1[i], temp, nns * 2, asize, mstd + 2);

                     s->expfunc(temp, nns);

                     s->wae5(temp, nns, mstd);

                 }


                 dstp[x] = FFMIN(FFMAX((int)(mstd[3] * scale + 0.5f), 0), s->max_value);

             }

             srcpp += src_stride * 2;

             dstp += dst_stride * 2;

         }

     }

 }


 // Number of selectable neighbourhood sizes (length of xdia_table/ydia_table in init()).
 #define NUM_NSIZE 7

 // Number of selectable neuron counts (length of nns_table in init()).
 #define NUM_NNS 5


 /**
  * Round f to the nearest integer (halves round towards +infinity) and
  * saturate the result to the int16_t range [-32768, 32767].
  *
  * The range check is done on the double before any conversion, so values
  * far outside the int range are handled without an out-of-range
  * double-to-int conversion. The previous version clamped only one side per
  * branch, so e.g. 40000.2 and -40000.5 were returned unclamped. NaN yields 0.
  */
 static int roundds(const double f)
 {
     int whole;

     if (f != f)
         return 0;
     if (f >= 32767.0)
         return 32767;
     if (f <= -32768.0)
         return -32768;

     // Truncate towards zero, then step down for negative non-integers to get floor(f).
     whole = (int)f;
     if (f < whole)
         whole--;

     return (f - whole >= 0.5) ? whole + 1 : whole;
 }


 /**
  * Fill in the function pointers of the context according to the "pscrn" and
  * "fapprox" options.
  */
 static void select_functions(NNEDIContext *s)
 {
     const int new_prescreener = s->pscrn >= 2;
     const int i16_prescreener = s->fapprox & 1;
     const int i16_predictor   = s->fapprox & 2;

     // Stages that have a single implementation.
     s->copy_pad      = copy_pad;
     s->evalfunc_0    = evalfunc_0;
     s->evalfunc_1    = evalfunc_1;
     s->process_line0 = process_line0;
     s->wae5          = weighted_avg_elliott_mul5_m16;
     s->expfunc       = e2_m16;

     // Prescreener (evalfunc_0): the new one only exists with int16 dot products.
     if (new_prescreener) {
         s->readpixels       = byte2word64;
         s->compute_network0 = compute_network0new;
     } else if (i16_prescreener) {
         s->readpixels       = byte2word48;
         s->compute_network0 = compute_network0_i16;
     } else {
         s->readpixels       = pixel2float48;
         s->compute_network0 = compute_network0;
     }

     // Predictor (evalfunc_1): int16 or float dot products.
     if (i16_predictor) {
         s->extract  = extract_m8_i16;
         s->dot_prod = dot_prods;
     } else {
         s->extract  = extract_m8;
         s->dot_prod = dot_prod;
     }
 }


 /**
  * Round m up to the next multiple of n; m is returned unchanged when it
  * already is a multiple of n.
  */
 static int modnpf(const int m, const int n)
 {
     const int rem = m % n;

     return rem ? m + n - rem : m;
 }


 /**
  * Produce one output frame in s->dst from s->src.
  *
  * Determines which field to keep, allocates the output frame, prepares the
  * per-plane work buffers in s->frame_data (allocated on first use and reused
  * afterwards) and runs the three processing stages. Planes not selected by
  * process_plane are copied unchanged.
  *
  * The temp scratch buffer is sized for the widest processed plane. It used
  * to be sized from plane 0 only, which was too small when plane 0 was
  * excluded from processing and another processed plane was wider than
  * 512 * sizeof(float) bytes.
  *
  * @param ctx       filter context
  * @param is_second non-zero when the second field of a frame is generated
  *                  (both-fields modes only)
  * @return 0 on success, a negative error code otherwise; on failure s->dst
  *         may hold an allocated frame that the caller has to free
  */
 static int get_frame(AVFilterContext *ctx, int is_second)
 {
     NNEDIContext *s = ctx->priv;
     AVFilterLink *outlink = ctx->outputs[0];
     AVFrame *src = s->src;
     FrameData *frame_data;
     int effective_field = s->field;
     size_t temp_size;
     int field_n;
     int plane;
     int ret;

     // Map the option value (-2 .. 3) onto a field index of 0 or 1.
     if (effective_field > 1)
         effective_field -= 2;
     else if (effective_field < 0)
         effective_field += 2;

     // In the "use frame flags" modes the frame's own field order wins.
     if (s->field < 0 && src->interlaced_frame && src->top_field_first == 0)
         effective_field = 0;
     else if (s->field < 0 && src->interlaced_frame && src->top_field_first == 1)
         effective_field = 1;
     else
         effective_field = !effective_field;

     if (s->field > 1 || s->field == -2) {
         if (is_second) {
             field_n = (effective_field == 0);
         } else {
             field_n = (effective_field == 1);
         }
     } else {
         field_n = effective_field;
     }

     s->dst = ff_get_video_buffer(outlink, outlink->w, outlink->h);
     if (!s->dst)
         return AVERROR(ENOMEM);
     ret = av_frame_copy_props(s->dst, src);
     if (ret < 0)
         return ret;
     s->dst->interlaced_frame = 0;

     frame_data = &s->frame_data;

     for (plane = 0; plane < s->nb_planes; plane++) {
         int dst_height = s->planeheight[plane];
         int dst_width = s->linesize[plane];

         const int min_alignment = 16;
         const int min_pad = 10;

         if (!(s->process_plane & (1 << plane))) {
             av_image_copy_plane(s->dst->data[plane], s->dst->linesize[plane],
                                 src->data[plane], src->linesize[plane],
                                 s->linesize[plane],
                                 s->planeheight[plane]);
             continue;
         }

         // 32 extra columns on each side, 6 extra rows above and below.
         frame_data->padded_width[plane]  = dst_width + 64;
         frame_data->padded_height[plane] = dst_height + 12;
         frame_data->padded_stride[plane] = modnpf(frame_data->padded_width[plane] + min_pad, min_alignment); // TODO: maybe min_pad is in pixels too?
         if (!frame_data->paddedp[plane]) {
             frame_data->paddedp[plane] = av_malloc_array(frame_data->padded_stride[plane], frame_data->padded_height[plane]);
             if (!frame_data->paddedp[plane])
                 return AVERROR(ENOMEM);
         }

         frame_data->dstp[plane] = s->dst->data[plane];
         frame_data->dst_stride[plane] = s->dst->linesize[plane];

         if (!frame_data->lcount[plane]) {
             frame_data->lcount[plane] = av_calloc(dst_height, sizeof(int32_t) * 16);
             if (!frame_data->lcount[plane])
                 return AVERROR(ENOMEM);
         } else {
             memset(frame_data->lcount[plane], 0, dst_height * sizeof(int32_t) * 16);
         }

         frame_data->field[plane] = field_n;
     }

     if (!frame_data->input) {
         frame_data->input = av_malloc(512 * sizeof(float));
         if (!frame_data->input)
             return AVERROR(ENOMEM);
     }
     // evalfunc_0 requires at least padded_width bytes of the widest processed plane.
     // evalfunc_1 requires at least 512 floats.
     if (!frame_data->temp) {
         int max_padded_width = 0;

         for (plane = 0; plane < s->nb_planes; plane++) {
             if (!(s->process_plane & (1 << plane)))
                 continue;
             max_padded_width = FFMAX(max_padded_width, frame_data->padded_width[plane]);
         }

         temp_size = FFMAX((size_t)max_padded_width, 512 * sizeof(float));
         frame_data->temp = av_malloc(temp_size);
         if (!frame_data->temp)
             return AVERROR(ENOMEM);
     }

     // Copy src to a padded "frame" in frame_data and mirror the edges.
     s->copy_pad(src, frame_data, s, field_n);

     // Handles prescreening and the cubic interpolation.
     s->evalfunc_0(s, frame_data);

     // The rest.
     s->evalfunc_1(s, frame_data);

     return 0;
 }


 /**
  * Consume one input frame.
  *
  * Single-field modes: src is deinterlaced (or passed through) and freed.
  *
  * Both-fields modes: the second field of the frame held in s->second is
  * emitted first, with a pts derived from that frame and src. Then src
  * becomes the new s->second and its first field is emitted.
  *
  * Frames are passed through as a clone when the filter is disabled or when
  * deint=1 and the frame is not flagged as interlaced. Output timestamps are
  * in half-frame units (input pts * 2).
  *
  * This function takes ownership of src on every path. Fixes over the
  * previous version:
  *  - s->src and s->second can refer to the same frame; on a get_frame()
  *    failure that frame is now freed once instead of twice;
  *  - src is no longer leaked on the error and EOF returns of the
  *    second-field path, nor in both-fields pass-through of a progressive
  *    frame with deint=1.
  *
  * @return 0 or the result of ff_filter_frame() on success, a negative error
  *         code otherwise
  */
 static int filter_frame(AVFilterLink *inlink, AVFrame *src)
 {
     AVFilterContext *ctx = inlink->dst;
     AVFilterLink *outlink = ctx->outputs[0];
     NNEDIContext *s = ctx->priv;
     const int both_fields = s->field > 1 || s->field == -2;
     int ret;

     // Both-fields modes: finish the previously held frame first.
     if (both_fields && s->second) {
         AVFrame *dst;

         s->src = s->second;
         ret = get_frame(ctx, 1);
         if (ret < 0) {
             av_frame_free(&s->dst);
             // s->src aliases s->second here: free the frame exactly once.
             av_frame_free(&s->second);
             s->src = NULL;
             av_frame_free(&src);
             return ret;
         }
         dst = s->dst;

         // dst->pts was copied from the held frame; adding the pts of src
         // gives the midpoint of both frames in the doubled time base.
         if (src->pts != AV_NOPTS_VALUE &&
             dst->pts != AV_NOPTS_VALUE)
             dst->pts += src->pts;
         else
             dst->pts = AV_NOPTS_VALUE;

         ret = ff_filter_frame(outlink, dst);
         if (ret < 0 || s->eof) {
             // At EOF src is only the flush frame built by request_frame().
             av_frame_free(&src);
             return ret < 0 ? ret : 0;
         }
         s->cur_pts = s->second->pts;
         av_frame_free(&s->second);
     }

     // Both-fields modes: hold on to src if it is going to be deinterlaced.
     if (both_fields && !ctx->is_disabled &&
         (!s->deint || src->interlaced_frame))
         s->second = src;

     // Pass-through: filter disabled, or progressive frame with deint=1.
     if ((s->deint && !src->interlaced_frame) || ctx->is_disabled) {
         AVFrame *dst = av_frame_clone(src);
         if (!dst) {
             av_frame_free(&src);
             av_frame_free(&s->second);
             return AVERROR(ENOMEM);
         }

         if (both_fields) {
             av_frame_free(&s->second);
             if ((s->deint && src->interlaced_frame) ||
                 (!s->deint))
                 s->second = src;
             else
                 av_frame_free(&src);
         } else {
             av_frame_free(&src);
         }
         if (dst->pts != AV_NOPTS_VALUE)
             dst->pts *= 2;
         return ff_filter_frame(outlink, dst);
     }

     s->src = src;
     ret = get_frame(ctx, 0);
     if (ret < 0) {
         av_frame_free(&s->dst);
         // In both-fields modes s->second is the same frame as s->src.
         if (s->second == s->src)
             s->second = NULL;
         av_frame_free(&s->second);
         av_frame_free(&s->src);
         return ret;
     }

     if (src->pts != AV_NOPTS_VALUE)
         s->dst->pts = src->pts * 2;
     // Single-field modes are done with src; both-fields modes keep it in s->second.
     if (s->field <= 1 && s->field > -2) {
         av_frame_free(&src);
         s->src = NULL;
     }

     return ff_filter_frame(outlink, s->dst);
 }


 /**
  * Request a frame from the input. When the input reports EOF while a frame
  * is still held in s->second, a clone of that frame with an extrapolated pts
  * is pushed through filter_frame() so that the pending second field is
  * emitted. The result of that call is returned instead of being discarded.
  *
  * @return 0 on success, AVERROR_EOF once the flush has been done, or another
  *         negative error code
  */
 static int request_frame(AVFilterLink *link)
 {
     AVFilterContext *ctx = link->src;
     NNEDIContext *s = ctx->priv;
     int ret;

     if (s->eof)
         return AVERROR_EOF;

     ret = ff_request_frame(ctx->inputs[0]);

     if (ret == AVERROR_EOF && s->second) {
         AVFrame *next = av_frame_clone(s->second);

         if (!next)
             return AVERROR(ENOMEM);

         // Continue the timeline by the distance between the last two frames.
         next->pts = s->second->pts * 2 - s->cur_pts;
         s->eof = 1;

         // filter_frame() takes ownership of next.
         return filter_frame(ctx->inputs[0], next);
     }

     if (ret < 0)
         return ret;

     return 0;
 }


 /**
  * Filter init callback: load the weights file and precompute the network
  * weights used by the filter.
  *
  * Steps performed, in order:
  *  - open s->weights_file, check that its size equals expected_size and
  *    read it completely into a temporary float buffer (bdata);
  *  - allocate s->weights0 and s->weights1[0..1];
  *  - derive the prescreener weights into s->weights0 (layout depends on
  *    s->pscrn and, for the old prescreener, on bit 0 of s->fapprox);
  *  - derive the two sets of prediction weights into s->weights1[] (int16
  *    or float layout depending on bit 1 of s->fapprox);
  *  - fill s->nns, s->xdia, s->ydia, s->asize and s->max_value, call
  *    select_functions() and allocate the float DSP context.
  *
  * bdata is released on every path that reaches the fail label, including
  * the success path. Buffers stored in the context are not released here;
  * uninit() in this file frees them.
  * NOTE(review): this relies on the framework calling uninit() after a
  * failed init -- confirm.
  *
  * @param ctx filter context whose priv data is an NNEDIContext
  * @return 0 on success, a negative AVERROR code on failure
  */
 static av_cold int init(AVFilterContext *ctx)
 {
     NNEDIContext *s = ctx->priv;
     FILE *weights_file = NULL;
     // Exact size in bytes the weights file must have; any other size is rejected.
     int64_t expected_size = 13574928;
     int64_t weights_size;
     float *bdata;
     size_t bytes_read;
     // Lookup tables indexed by s->nsize (xdia/ydia) and s->nnsparam (nns).
     const int xdia_table[NUM_NSIZE] = { 8, 16, 32, 48, 8, 16, 32 };
     const int ydia_table[NUM_NSIZE] = { 6, 6, 6, 6, 4, 4, 4 };
     const int nns_table[NUM_NNS] = { 16, 32, 64, 128, 256 };
     // Float counts of the old (252) and new (280) prescreener blocks in bdata.
     const int dims0 = 49 * 4 + 5 * 4 + 9 * 4;
     const int dims0new = 4 * 65 + 4 * 5;
     // Float count of one prediction weight set for the selected nns/nsize:
     // 2 * nns neurons, each with xdia * ydia weights plus one bias.
     const int dims1 = nns_table[s->nnsparam] * 2 * (xdia_table[s->nsize] * ydia_table[s->nsize] + 1);
     int dims1tsize = 0;
     int dims1offset = 0;
     int ret = 0, i, j, k;

     weights_file = fopen(s->weights_file, "rb");
     if (!weights_file) {
         av_log(ctx, AV_LOG_ERROR, "No weights file provided, aborting!\n");
         return AVERROR(EINVAL);
     }

     // Determine the file size by seeking to the end and reading the position.
     if (fseek(weights_file, 0, SEEK_END)) {
         av_log(ctx, AV_LOG_ERROR, "Couldn't seek to the end of weights file.\n");
         fclose(weights_file);
         return AVERROR(EINVAL);
     }

     weights_size = ftell(weights_file);

     if (weights_size == -1) {
         fclose(weights_file);
         av_log(ctx, AV_LOG_ERROR, "Couldn't get size of weights file.\n");
         return AVERROR(EINVAL);
     } else if (weights_size != expected_size) {
         fclose(weights_file);
         av_log(ctx, AV_LOG_ERROR, "Unexpected weights file size.\n");
         return AVERROR(EINVAL);
     }

     if (fseek(weights_file, 0, SEEK_SET)) {
         fclose(weights_file);
         av_log(ctx, AV_LOG_ERROR, "Couldn't seek to the start of weights file.\n");
         return AVERROR(EINVAL);
     }

     // From here on every error path must go through fail so bdata is freed.
     bdata = (float *)av_malloc(expected_size);
     if (!bdata) {
         fclose(weights_file);
         return AVERROR(ENOMEM);
     }

     bytes_read = fread(bdata, 1, expected_size, weights_file);

     if (bytes_read != (size_t)expected_size) {
         fclose(weights_file);
         ret = AVERROR_INVALIDDATA;
         av_log(ctx, AV_LOG_ERROR, "Couldn't read weights file.\n");
         goto fail;
     }

     fclose(weights_file);

     // Walk all (nns, nsize) combinations in file order: dims1tsize ends up as
     // the float count of one complete table of prediction weights, and
     // dims1offset as the offset of the selected combination inside it.
     // The trailing "* 2" accounts for the two consecutive weight sets that
     // are read further down via "i * dims1".
     for (j = 0; j < NUM_NNS; j++) {
         for (i = 0; i < NUM_NSIZE; i++) {
             if (i == s->nsize && j == s->nnsparam)
                 dims1offset = dims1tsize;
             dims1tsize += nns_table[j] * 2 * (xdia_table[i] * ydia_table[i] + 1) * 2;
         }
     }

     // One buffer large enough for either prescreener layout.
     s->weights0 = av_malloc_array(FFMAX(dims0, dims0new), sizeof(float));
     if (!s->weights0) {
         ret = AVERROR(ENOMEM);
         goto fail;
     }

     for (i = 0; i < 2; i++) {
         s->weights1[i] = av_malloc_array(dims1, sizeof(float));
         if (!s->weights1[i]) {
             ret = AVERROR(ENOMEM);
             goto fail;
         }
     }

     // Adjust prescreener weights
     if (s->pscrn >= 2) {// using new prescreener
         const float *bdw;
         int16_t *ws;
         float *wf;
         double mean[4] = { 0.0, 0.0, 0.0, 0.0 };
         int *offt = av_calloc(4 * 64, sizeof(int));

         if (!offt) {
             ret = AVERROR(ENOMEM);
             goto fail;
         }

         // offt maps (neuron j, weight k) to its position in the source block:
         // (k / 8) * 32 + j * 8 + (k % 8), i.e. the four neurons are
         // interleaved in runs of eight weights.
         for (j = 0; j < 4; j++)
             for (k = 0; k < 64; k++)
                 offt[j * 64 + k] = ((k >> 3) << 5) + ((j & 3) << 3) + (k & 7);

         // Source block for this prescreener: skip the old prescreener block
         // (dims0) and (pscrn - 2) new prescreener blocks.
         bdw = bdata + dims0 + dims0new * (s->pscrn - 2);
         // weights0 is reused as 4 * 64 int16 weights followed by floats.
         ws = (int16_t *)s->weights0;
         wf = (float *)&ws[4 * 64];
         // Calculate mean weight of each first layer neuron
         for (j = 0; j < 4; j++) {
             double cmean = 0.0;
             for (k = 0; k < 64; k++)
                 cmean += bdw[offt[j * 64 + k]];
             mean[j] = cmean / 64.0;
         }
         // Factor mean removal and 1.0/127.5 scaling
         // into first layer weights. scale to int16 range
         for (j = 0; j < 4; j++) {
             double scale, mval = 0.0;

             // mval: largest absolute adjusted weight of neuron j.
             for (k = 0; k < 64; k++)
                 mval = FFMAX(mval, FFABS((bdw[offt[j * 64 + k]] - mean[j]) / 127.5));
             scale = 32767.0 / mval;
             for (k = 0; k < 64; k++)
                 ws[offt[j * 64 + k]] = roundds(((bdw[offt[j * 64 + k]] - mean[j]) / 127.5) * scale);
             // Inverse of scale, stored as float after the int16 weights.
             wf[j] = (float)(mval / 32767.0);
         }
         // Copy the rest of the block (everything after the 4 * 64 first
         // layer weights) unchanged.
         memcpy(wf + 4, bdw + 4 * 64, (dims0new - 4 * 64) * sizeof(float));
         av_free(offt);
     } else { // using old prescreener
         double mean[4] = { 0.0, 0.0, 0.0, 0.0 };
         // Calculate mean weight of each first layer neuron
         for (j = 0; j < 4; j++) {
             double cmean = 0.0;
             for (k = 0; k < 48; k++)
                 cmean += bdata[j * 48 + k];
             mean[j] = cmean / 48.0;
         }
         if (s->fapprox & 1) {// use int16 dot products in first layer
             // weights0 is reused as 4 * 48 int16 weights followed by floats.
             int16_t *ws = (int16_t *)s->weights0;
             float *wf = (float *)&ws[4 * 48];
             // Factor mean removal and 1.0/127.5 scaling
             // into first layer weights. scale to int16 range
             for (j = 0; j < 4; j++) {
                 double scale, mval = 0.0;
                 for (k = 0; k < 48; k++)
                     mval = FFMAX(mval, FFABS((bdata[j * 48 + k] - mean[j]) / 127.5));
                 scale = 32767.0 / mval;
                 for (k = 0; k < 48; k++)
                     ws[j * 48 + k] = roundds(((bdata[j * 48 + k] - mean[j]) / 127.5) * scale);
                 wf[j] = (float)(mval / 32767.0);
             }
             memcpy(wf + 4, bdata + 4 * 48, (dims0 - 4 * 48) * sizeof(float));
         } else {// use float dot products in first layer
             // half = 255 / 2 = 127.5
             double half = (1 << 8) - 1;

             half /= 2;

             // Factor mean removal and 1.0/half scaling
             // into first layer weights.
             for (j = 0; j < 4; j++)
                 for (k = 0; k < 48; k++)
                     s->weights0[j * 48 + k] = (float)((bdata[j * 48 + k] - mean[j]) / half);
             memcpy(s->weights0 + 4 * 48, bdata + 4 * 48, (dims0 - 4 * 48) * sizeof(float));
         }
     }

     // Adjust prediction weights
     for (i = 0; i < 2; i++) {
         // Source of set i: skip the old prescreener block, three new
         // prescreener blocks and s->etype complete prediction tables, then
         // move to the selected nns/nsize combination and to set i within it.
         const float *bdataT = bdata + dims0 + dims0new * 3 + dims1tsize * s->etype + dims1offset + i * dims1;
         const int nnst = nns_table[s->nnsparam];
         const int asize = xdia_table[s->nsize] * ydia_table[s->nsize];
         // Offset of the biases in bdataT: they follow the nnst * 2 * asize weights.
         const int boff = nnst * 2 * asize;
         // mean layout: [0, asize)     mean softmax neuron weights,
         //              [asize]        mean softmax bias,
         //              [asize + 1 ..) mean weight of each of the nnst * 2 neurons.
         double *mean = (double *)av_calloc(asize + 1 + nnst * 2, sizeof(double));

         if (!mean) {
             ret = AVERROR(ENOMEM);
             goto fail;
         }

         // Calculate mean weight of each neuron (ignore bias)
         for (j = 0; j < nnst * 2; j++) {
             double cmean = 0.0;
             for (k = 0; k < asize; k++)
                 cmean += bdataT[j * asize + k];
             mean[asize + 1 + j] = cmean / (double)asize;
         }
         // Calculate mean softmax neuron
         for (j = 0; j < nnst; j++) {
             for (k = 0; k < asize; k++)
                 mean[k] += bdataT[j * asize + k] - mean[asize + 1 + j];
             mean[asize] += bdataT[boff + j];
         }
         for (j = 0; j < asize + 1; j++)
             mean[j] /= (double)(nnst);

         if (s->fapprox & 2) { // use int16 dot products
             // weights1[i] is reused as nnst * 2 * asize int16 weights followed
             // by floats; for every group of four neurons the float area holds
             // four scale factors followed by four biases.
             int16_t *ws = (int16_t *)s->weights1[i];
             float *wf = (float *)&ws[nnst * 2 * asize];
             // Factor mean removal into weights, remove global offset from
             // softmax neurons, and scale weights to int16 range.
             for (j = 0; j < nnst; j++) { // softmax neurons
                 double scale, mval = 0.0;
                 for (k = 0; k < asize; k++)
                     mval = FFMAX(mval, FFABS(bdataT[j * asize + k] - mean[asize + 1 + j] - mean[k]));
                 scale = 32767.0 / mval;
                 for (k = 0; k < asize; k++)
                     ws[j * asize + k] = roundds((bdataT[j * asize + k] - mean[asize + 1 + j] - mean[k]) * scale);
                 wf[(j >> 2) * 8 + (j & 3)] = (float)(mval / 32767.0);
                 wf[(j >> 2) * 8 + (j & 3) + 4] = (float)(bdataT[boff + j] - mean[asize]);
             }
             for (j = nnst; j < nnst * 2; j++) { // elliott neurons
                 double scale, mval = 0.0;
                 for (k = 0; k < asize; k++)
                     mval = FFMAX(mval, FFABS(bdataT[j * asize + k] - mean[asize + 1 + j]));
                 scale = 32767.0 / mval;
                 for (k = 0; k < asize; k++)
                     ws[j * asize + k] = roundds((bdataT[j * asize + k] - mean[asize + 1 + j]) * scale);
                 wf[(j >> 2) * 8 + (j & 3)] = (float)(mval / 32767.0);
                 // Bias is copied unchanged for these neurons.
                 wf[(j >> 2) * 8 + (j & 3) + 4] = bdataT[boff + j];
             }
         } else { // use float dot products
             // Factor mean removal into weights, and remove global
             // offset from softmax neurons.
             for (j = 0; j < nnst * 2; j++) {
                 for (k = 0; k < asize; k++) {
                     // Only the first nnst (softmax) neurons get the mean neuron removed.
                     const double q = j < nnst ? mean[k] : 0.0;
                     s->weights1[i][j * asize + k] = (float)(bdataT[j * asize + k] - mean[asize + 1 + j] - q);
                 }
                 s->weights1[i][boff + j] = (float)(bdataT[boff + j] - (j < nnst ? mean[asize] : 0.0));
             }
         }
         av_free(mean);
     }

     // Cache the selected network dimensions in the context.
     s->nns = nns_table[s->nnsparam];
     s->xdia = xdia_table[s->nsize];
     s->ydia = ydia_table[s->nsize];
     s->asize = xdia_table[s->nsize] * ydia_table[s->nsize];

     // 65535 >> 8 == 255
     s->max_value = 65535 >> 8;

     select_functions(s);

     s->fdsp = avpriv_float_dsp_alloc(0);
     if (!s->fdsp)
         ret = AVERROR(ENOMEM);

     // Reached on success as well: the raw file contents are no longer needed.
 fail:
     av_free(bdata);
     return ret;
 }


 /**
  * Filter uninit callback: release every buffer owned by the private
  * context (prescreener and prediction weights, per-plane padded images and
  * line counters, scratch buffers, the float DSP context) and the frame
  * still held in s->second.
  *
  * @param ctx filter context whose priv data is an NNEDIContext
  */
 static av_cold void uninit(AVFilterContext *ctx)
 {
     NNEDIContext *s = ctx->priv;
     int remaining = s->nb_planes;

     // Network weights.
     av_freep(&s->weights0);
     av_freep(&s->weights1[0]);
     av_freep(&s->weights1[1]);

     // Per-plane buffers; the releases are independent, so the order in
     // which the planes are visited does not matter.
     while (remaining-- > 0) {
         av_freep(&s->frame_data.paddedp[remaining]);
         av_freep(&s->frame_data.lcount[remaining]);
     }

     // Scratch buffers shared by all planes.
     av_freep(&s->frame_data.input);
     av_freep(&s->frame_data.temp);

     av_freep(&s->fdsp);
     av_frame_free(&s->second);
 }


 /*
  * Input pads of the filter: a single video pad named "default" whose
  * frames are handled by filter_frame() and whose link is configured by
  * config_input(). The array ends with an entry whose name is NULL.
  */
 static const AVFilterPad inputs[] = {
     {
         .type          = AVMEDIA_TYPE_VIDEO,
         .name          = "default",
         .config_props  = config_input,
         .filter_frame  = filter_frame,
     },
     { NULL }
 };


 /*
  * Output pads of the filter: a single video pad named "default" whose
  * link is configured by config_output() and which serves frame requests
  * through request_frame(). The array ends with an entry whose name is NULL.
  */
 static const AVFilterPad outputs[] = {
     {
         .type          = AVMEDIA_TYPE_VIDEO,
         .name          = "default",
         .request_frame = request_frame,
         .config_props  = config_output,
     },
     { NULL }
 };


 /*
  * Filter definition for "nnedi": ties together the private context
  * (NNEDIContext / nnedi_class), the lifecycle callbacks, format negotiation
  * and the pad tables declared in this file.
  */
 AVFilter ff_vf_nnedi = {
     // Identification
     .name          = "nnedi",
     .description   = NULL_IF_CONFIG_SMALL("Apply neural network edge directed interpolation intra-only deinterlacer."),

     // Private context
     .priv_class    = &nnedi_class,
     .priv_size     = sizeof(NNEDIContext),

     // Callbacks
     .init          = init,
     .uninit        = uninit,
     .query_formats = query_formats,

     // Pads
     .inputs        = inputs,
     .outputs       = outputs,

     .flags         = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,
 };

filter_frame
static int filter_frame(AVFilterLink *inlink, AVFrame *src)
Definition: vf_nnedi.c:794

FLAGS
#define FLAGS
Definition: vf_nnedi.c:105

plane
int plane
Definition: avisynth_c.h:422

NNEDIContext::xdia
int xdia
Definition: vf_nnedi.c:70

NULL
#define NULL
Definition: coverity.c:32

NNEDIContext::cur_pts
int64_t cur_pts
Definition: vf_nnedi.c:59

s
const char * s
Definition: avisynth_c.h:768

AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59

av_pix_fmt_desc_get
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2266

chroma
static av_always_inline void chroma(WaveformContext *s, AVFrame *in, AVFrame *out, int component, int intensity, int offset_y, int offset_x, int column, int mirror)
Definition: vf_waveform.c:1323

AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:184

AV_PIX_FMT_NONE
Definition: pixfmt.h:61

src_pitch
BYTE int const BYTE int src_pitch
Definition: avisynth_c.h:813

AVOption
AVOption.
Definition: opt.h:245

data
ptrdiff_t const GLvoid * data
Definition: opengl_enc.c:101

config_input
static int config_input(AVFilterLink *inlink)
Definition: vf_nnedi.c:150

AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:67

imgutils.h
misc image utilities

av_pix_fmt_count_planes
int av_pix_fmt_count_planes(enum AVPixelFormat pix_fmt)
Definition: pixdesc.c:2306

avfilter.h
Main libavfilter public API header.

temp
else temp
Definition: vf_mcdeint.c:259

desc
const char * desc
Definition: nvenc.c:101

AV_OPT_TYPE_INT
Definition: opt.h:223

NNEDIContext::weights_file
char * weights_file
Definition: vf_nnedi.c:53

compute_network0_i16
static void compute_network0_i16(NNEDIContext *s, const float *inputf, const float *weightsf, uint8_t *d)
Definition: vf_nnedi.c:314

AVFilterLink::h
int h
agreed upon image height
Definition: avfilter.h:391

AV_PIX_FMT_GBRP
planar GBR 4:4:4 24bpp
Definition: pixfmt.h:180

AVRational::num
int num
Numerator.
Definition: rational.h:59

NNEDIContext::dot_prod
void(* dot_prod)(struct NNEDIContext *, const float *, const float *, float *, const int, const int, const float *)
Definition: vf_nnedi.c:97

float_dsp.h

AVFloatDSPContext::scalarproduct_float
float(* scalarproduct_float)(const float *v1, const float *v2, int len)
Calculate the scalar product of two vectors of floats.
Definition: float_dsp.h:159

NNEDIContext::weights1
float * weights1[2]
Definition: vf_nnedi.c:67

NNEDIContext::second
AVFrame * second
Definition: vf_nnedi.c:56

compute_network0
static void compute_network0(NNEDIContext *s, const float *input, const float *weights, uint8_t *d)
Definition: vf_nnedi.c:297

t8
#define t8
Definition: regdef.h:53

ff_get_video_buffer
AVFrame * ff_get_video_buffer(AVFilterLink *link, int w, int h)
Request a picture buffer with a specific set of permissions.
Definition: video.c:76

NNEDIContext::frame_data
FrameData frame_data
Definition: vf_nnedi.c:101

fn
#define fn(a)
Definition: colorspacedsp_template.c:42

NNEDIContext::max_value
int max_value
Definition: vf_nnedi.c:84

AVFilterContext::is_disabled
int is_disabled
the enabled state from the last expression evaluation
Definition: avfilter.h:354

FrameData::field
int field[3]
Definition: vf_nnedi.c:43

FrameData::temp
float * temp
Definition: vf_nnedi.c:47

av_calloc
void * av_calloc(size_t nmemb, size_t size)
Non-inlined equivalent of av_mallocz_array().
Definition: mem.c:260

ff_make_format_list
AVFilterFormats * ff_make_format_list(const int *fmts)
Create a list of supported formats.
Definition: formats.c:283

dot_prod
static void dot_prod(NNEDIContext *s, const float *data, const float *weights, float *vals, const int n, const int len, const float *scale)
Definition: vf_nnedi.c:268

FrameData::padded_height
int padded_height[3]
Definition: vf_nnedi.c:38

srcp
BYTE int const BYTE * srcp
Definition: avisynth_c.h:813

AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:59

AVFilterContext::inputs
AVFilterLink ** inputs
array of pointers to input links
Definition: avfilter.h:315

FrameData::dst_stride
int dst_stride[3]
Definition: vf_nnedi.c:41

request_frame
static int request_frame(AVFilterLink *link)
Definition: vf_nnedi.c:879

AV_OPT_TYPE_CONST
Definition: opt.h:231

ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1189

elliott
static void elliott(float *data, const int n)
Definition: vf_nnedi.c:260

NUM_NSIZE
#define NUM_NSIZE
Definition: vf_nnedi.c:635

NNEDIContext::evalfunc_0
void(* evalfunc_0)(struct NNEDIContext *, FrameData *)
Definition: vf_nnedi.c:87

uint8_t
uint8_t
Definition: audio_convert.c:194

av_cold
#define av_cold
Definition: attributes.h:82

av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31

opt.h
AVOptions.

FrameData
Definition: vf_nnedi.c:34

NNEDIContext::wae5
void(* wae5)(const float *, const int, float *)
Definition: vf_nnedi.c:99

NNEDIContext::src
AVFrame * src
Definition: vf_nnedi.c:55

outputs
static const AVFilterPad outputs[]
Definition: vf_nnedi.c:1190

AVFrame::pts
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
Definition: frame.h:268

NNEDIContext::process_plane
int process_plane
Definition: vf_nnedi.c:76

NNEDIContext::etype
int etype
Definition: vf_nnedi.c:80

copy_pad
static void copy_pad(const AVFrame *src, FrameData *frame_data, NNEDIContext *s, int fn)
Definition: vf_nnedi.c:204

height
#define height

AV_OPT_TYPE_STRING
Definition: opt.h:227

NNEDIContext::nns
int nns
Definition: vf_nnedi.c:69

AV_PIX_FMT_YUVJ440P
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range...
Definition: pixfmt.h:101

AV_PIX_FMT_YUVJ422P
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
Definition: pixfmt.h:75

AVERROR_EOF
#define AVERROR_EOF
End of file.
Definition: error.h:55

float.h

AVFrame::interlaced_frame
int interlaced_frame
The content of the picture is interlaced.
Definition: frame.h:322

uninit
static av_cold void uninit(AVFilterContext *ctx)
Definition: vf_nnedi.c:1159

video.h

min_weight_sum
const float min_weight_sum
Definition: vf_nnedi.c:560

evalfunc_1
static void evalfunc_1(NNEDIContext *s, FrameData *frame_data)
Definition: vf_nnedi.c:578

roundds
static int roundds(const double f)
Definition: vf_nnedi.c:638

av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28

modnpf
static int modnpf(const int m, const int n)
Definition: vf_nnedi.c:682

NNEDIContext::evalfunc_1
void(* evalfunc_1)(struct NNEDIContext *, FrameData *)
Definition: vf_nnedi.c:88

exp_hi
static const float exp_hi
Definition: vf_nnedi.c:550

AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:53

NNEDIContext::process_line0
int32_t(* process_line0)(const uint8_t *, int, uint8_t *, const uint8_t *, const int, const int, const int)
Definition: vf_nnedi.c:93

AVFilterLink
A link between two filters.
Definition: avfilter.h:380

AVFILTER_DEFINE_CLASS
AVFILTER_DEFINE_CLASS(nnedi)

NNEDIContext::eof
int eof
Definition: vf_nnedi.c:58

OFFSET
#define OFFSET(x)
Definition: vf_nnedi.c:104

AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176

ff_set_common_formats
int ff_set_common_formats(AVFilterContext *ctx, AVFilterFormats *formats)
A helper for query_formats() which sets all links to the same list of formats.
Definition: formats.c:568

AVPixFmtDescriptor::log2_chroma_h
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
Definition: pixdesc.h:101

NNEDIContext::fdsp
AVFloatDSPContext * fdsp
Definition: vf_nnedi.c:61

AVFilterLink::frame_rate
AVRational frame_rate
Frame rate of the stream on the link, or 1/0 if unknown or variable; if left to 0/0, will be automatically copied from the first input of the source filter if it exists.
Definition: avfilter.h:483

mask
static const uint16_t mask[17]
Definition: lzw.c:38

select_functions
static void select_functions(NNEDIContext *s)
Definition: vf_nnedi.c:645

dstp
BYTE * dstp
Definition: avisynth_c.h:813

AVERROR
#define AVERROR(e)
Definition: error.h:43

av_frame_free
void av_frame_free(AVFrame **frame)
Free the frame and any dynamically allocated objects in it, e.g.
Definition: frame.c:158

NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
Definition: internal.h:176

AVFilterContext::priv
void * priv
private data for use by the filter
Definition: avfilter.h:322

NNEDIContext::nsize
int nsize
Definition: vf_nnedi.c:77

AVFilterLink::time_base
AVRational time_base
Define the time base used by the PTS of the frames/samples which will pass through this link...
Definition: avfilter.h:406

FrameData::padded_width
int padded_width[3]
Definition: vf_nnedi.c:37

count
GLsizei count
Definition: opengl_enc.c:109

FFMAX
#define FFMAX(a, b)
Definition: common.h:94

fail
#define fail()
Definition: checkasm.h:83

exp
int8_t exp
Definition: eval.c:64

get_frame
static int get_frame(AVFilterContext *ctx, int is_second)
Definition: vf_nnedi.c:689

NNEDIContext::asize
int asize
Definition: vf_nnedi.c:68

AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:66

FrameData::input
float * input
Definition: vf_nnedi.c:46

AVFilterLink::w
int w
agreed upon image width
Definition: avfilter.h:390

NNEDIContext::qual
int qual
Definition: vf_nnedi.c:79

weighted_avg_elliott_mul5_m16
static void weighted_avg_elliott_mul5_m16(const float *w, const int n, float *mstd)
Definition: vf_nnedi.c:562

query_formats
static int query_formats(AVFilterContext *ctx)
Definition: vf_nnedi.c:184

pixdesc.h

NNEDIContext::ydia
int ydia
Definition: vf_nnedi.c:71

FFMIN
#define FFMIN(a, b)
Definition: common.h:96

NNEDIContext::compute_network0
void(* compute_network0)(struct NNEDIContext *s, const float *, const float *, uint8_t *)
Definition: vf_nnedi.c:92

AV_PIX_FMT_YUVJ420P
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
Definition: pixfmt.h:74

NNEDIContext::nnsparam
int nnsparam
Definition: vf_nnedi.c:78

width
#define width

void
typedef void(APIENTRY *FF_PFNGLACTIVETEXTUREPROC)(GLenum texture)

inputs
static const AVFilterPad inputs[]
Definition: vf_nnedi.c:1180

int32_t
int32_t
Definition: audio_convert.c:194

ctx
AVFormatContext * ctx
Definition: movenc.c:48

ff_vf_nnedi
AVFilter ff_vf_nnedi
Definition: vf_nnedi.c:1200

FFABS
#define FFABS(a)
Absolute value, Note, INT_MIN / INT64_MIN result in undefined behavior as they are not representable ...
Definition: common.h:72

n
int n
Definition: avisynth_c.h:684

FrameData::dstp
uint8_t * dstp[3]
Definition: vf_nnedi.c:40

AVFilterLink::src
AVFilterContext * src
source filter
Definition: avfilter.h:381

AVFloatDSPContext
Definition: float_dsp.h:24

src
#define src
Definition: vp9dsp.c:530

evalfunc_0
static void evalfunc_0(NNEDIContext *s, FrameData *frame_data)
Definition: vf_nnedi.c:418

av_frame_clone
AVFrame * av_frame_clone(const AVFrame *src)
Create a new frame that references the same data as src.
Definition: frame.c:480

AVFilterLink::format
int format
agreed upon media format
Definition: avfilter.h:397

extract_m8
static void extract_m8(const uint8_t *srcp8, const int stride, const int xdia, const int ydia, float *mstd, float *input)
Definition: vf_nnedi.c:487

NNEDIContext::pscrn
int pscrn
Definition: vf_nnedi.c:81

e2_m16
static void e2_m16(float *s, const int n)
Definition: vf_nnedi.c:552

AVFrame::linesize
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Definition: frame.h:215

NNEDIContext::deint
int deint
Definition: vf_nnedi.c:74

AVPixFmtDescriptor
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
Definition: pixdesc.h:81

FrameData::padded_stride
int padded_stride[3]
Definition: vf_nnedi.c:36

AV_PIX_FMT_YUV410P
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
Definition: pixfmt.h:68

AVClass
Describe the class of an AVClass context structure.
Definition: log.h:67

AVFilter
Filter definition.
Definition: avfilter.h:144

av_image_fill_linesizes
int av_image_fill_linesizes(int linesizes[4], enum AVPixelFormat pix_fmt, int width)
Fill plane linesizes for an image with pixel format pix_fmt and width width.
Definition: imgutils.c:88

FrameData::lcount
int32_t * lcount[3]
Definition: vf_nnedi.c:45

AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58

compute_network0new
static void compute_network0new(NNEDIContext *s, const float *datai, const float *weights, uint8_t *d)
Definition: vf_nnedi.c:383

byte2word48
static void byte2word48(const uint8_t *t, const int pitch, float *pf)
Definition: vf_nnedi.c:342

AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:148

pixel2float48
static void pixel2float48(const uint8_t *t8, const int pitch, float *p)
Definition: vf_nnedi.c:332

avpriv_float_dsp_alloc
av_cold AVFloatDSPContext * avpriv_float_dsp_alloc(int bit_exact)
Allocate a float DSP context.
Definition: float_dsp.c:119

NNEDIContext
Definition: vf_nnedi.c:50

NNEDIContext::extract
void(* extract)(const uint8_t *, const int, const int, const int, float *, float *)
Definition: vf_nnedi.c:96

AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
Definition: avfilter.h:133

AVFilterContext::outputs
AVFilterLink ** outputs
array of pointers to output links
Definition: avfilter.h:319

pix_fmts
static enum AVPixelFormat pix_fmts[]
Definition: libkvazaar.c:262

NNEDIContext::dst
AVFrame * dst
Definition: vf_nnedi.c:57

flags
static int flags
Definition: cpu.c:47

AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:198

NNEDIContext::fapprox
int fapprox
Definition: vf_nnedi.c:82

process_line0
static int32_t process_line0(const uint8_t *tempu, int width, uint8_t *dstp8, const uint8_t *src3p8, const int src_pitch, const int max_value, const int chroma)
Definition: vf_nnedi.c:352

stride
GLint GLenum GLboolean GLsizei stride
Definition: opengl_enc.c:105

AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:62

AV_PIX_FMT_GRAY8
Y , 8bpp.
Definition: pixfmt.h:70

common.h
common internal and external API header

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

config_output
static int config_output(AVFilterLink *outlink)
Definition: vf_nnedi.c:167

NUM_NNS
#define NUM_NNS
Definition: vf_nnedi.c:636

AV_PIX_FMT_YUVJ444P
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
Definition: pixfmt.h:76

AV_PIX_FMT_YUV411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
Definition: pixfmt.h:69

AVRational::den
int den
Denominator.
Definition: rational.h:60

NNEDIContext::nb_planes
int nb_planes
Definition: vf_nnedi.c:62

NNEDIContext::readpixels
void(* readpixels)(const uint8_t *, const int, float *)
Definition: vf_nnedi.c:91

NNEDIContext::linesize
int linesize[4]
Definition: vf_nnedi.c:63

NNEDIContext::weights0
float * weights0
Definition: vf_nnedi.c:66

av_free
#define av_free(p)
Definition: tableprint_vlc.h:34

AVFrame::top_field_first
int top_field_first
If the content is interlaced, is top field displayed first.
Definition: frame.h:327

init
static av_cold int init(AVFilterContext *ctx)
Definition: vf_nnedi.c:907

len
int len
Definition: vorbis_enc_data.h:452

byte2word64
static void byte2word64(const uint8_t *t, const int pitch, float *p)
Definition: vf_nnedi.c:373

NNEDIContext::planeheight
int planeheight[4]
Definition: vf_nnedi.c:64

AVFilterLink::dst
AVFilterContext * dst
dest filter
Definition: avfilter.h:384

tmp
static uint8_t tmp[8]
Definition: des.c:38

NNEDIContext::expfunc
void(* expfunc)(float *, const int)
Definition: vf_nnedi.c:98

AVFilterFormats
A list of supported formats for one end of a filter link.
Definition: formats.h:64

AV_PIX_FMT_YUVJ411P
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
Definition: pixfmt.h:272

formats.h

AVFilterContext
An instance of a filter.
Definition: avfilter.h:307

av_mul_q
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
Definition: rational.c:80

nnedi_options
static const AVOption nnedi_options[]
Definition: vf_nnedi.c:107

av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35

FrameData::paddedp
uint8_t * paddedp[3]
Definition: vf_nnedi.c:35

NNEDIContext::field
int field
Definition: vf_nnedi.c:75

AV_PIX_FMT_YUV440P
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
Definition: pixfmt.h:100

AVMEDIA_TYPE_VIDEO
Definition: avutil.h:195

av_malloc_array
#define av_malloc_array(a, b)
Definition: tableprint_vlc.h:32

dot_prods
static void dot_prods(NNEDIContext *s, const float *dataf, const float *weightsf, float *vals, const int n, const int len, const float *scale)
Definition: vf_nnedi.c:281

ff_request_frame
int ff_request_frame(AVFilterLink *link)
Request an input frame from the filter at the other end of the link.
Definition: avfilter.c:369

av_image_copy_plane
void av_image_copy_plane(uint8_t *dst, int dst_linesize, const uint8_t *src, int src_linesize, int bytewidth, int height)
Copy image plane from src to dst.
Definition: imgutils.c:287

internal.h
internal API functions

extract_m8_i16
static void extract_m8_i16(const uint8_t *srcp, const int stride, const int xdia, const int ydia, float *mstd, float *inputf)
Definition: vf_nnedi.c:520

AVPixelFormat
AVPixelFormat
Pixel format.
Definition: pixfmt.h:60

NNEDIContext::copy_pad
void(* copy_pad)(const AVFrame *, FrameData *, struct NNEDIContext *, int)
Definition: vf_nnedi.c:86

for
for(j=16;j >0;--j)
Definition: h264pred_template.c:469

av_frame_copy_props
int av_frame_copy_props(AVFrame *dst, const AVFrame *src)
Copy only "metadata" fields from src to dst.
Definition: frame.c:589

AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:242

exp_lo
static const float exp_lo
Definition: vf_nnedi.c:549

AV_CEIL_RSHIFT
#define AV_CEIL_RSHIFT(a, b)
Definition: common.h:58