67 int jobnr,
int nb_jobs);
71 #define OFFSET(x) offsetof(SSIMContext, x) 72 #define FLAGS AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_VIDEO_PARAM 85 snprintf(value,
sizeof(value),
"%f", d);
88 snprintf(key2,
sizeof(key2),
"%s%c", key, comp);
96 const uint8_t *ref8, ptrdiff_t ref_stride,
97 int64_t (*sums)[4],
int width)
99 const uint16_t *main16 = (
const uint16_t *)main8;
100 const uint16_t *ref16 = (
const uint16_t *)ref8;
106 for (z = 0; z <
width; z++) {
107 uint64_t
s1 = 0,
s2 = 0,
ss = 0, s12 = 0;
109 for (y = 0; y < 4; y++) {
110 for (x = 0; x < 4; x++) {
111 unsigned a = main16[x + y * main_stride];
112 unsigned b = ref16[x + y * ref_stride];
133 int (*sums)[4],
int width)
137 for (z = 0; z <
width; z++) {
138 uint32_t
s1 = 0,
s2 = 0,
ss = 0, s12 = 0;
140 for (y = 0; y < 4; y++) {
141 for (x = 0; x < 4; x++) {
142 int a = main[x + y * main_stride];
143 int b = ref[x + y * ref_stride];
164 int64_t ssim_c1 = (int64_t)(.01*.01*max*max*64 + .5);
165 int64_t ssim_c2 = (int64_t)(.03*.03*max*max*64*63 + .5);
171 int64_t
vars = fss * 64 - fs1 * fs1 - fs2 * fs2;
172 int64_t covar = fs12 * 64 - fs1 * fs2;
174 return (
float)(2 * fs1 * fs2 + ssim_c1) * (
float)(2 * covar + ssim_c2)
175 / ((
float)(fs1 * fs1 + fs2 * fs2 + ssim_c1) * (
float)(vars + ssim_c2));
180 static const int ssim_c1 = (
int)(.01*.01*255*255*64 + .5);
181 static const int ssim_c2 = (
int)(.03*.03*255*255*64*63 + .5);
187 int vars = fss * 64 - fs1 * fs1 - fs2 * fs2;
188 int covar = fs12 * 64 - fs1 * fs2;
190 return (
float)(2 * fs1 * fs2 + ssim_c1) * (
float)(2 * covar + ssim_c2)
191 / ((
float)(fs1 * fs1 + fs2 * fs2 + ssim_c1) * (
float)(vars + ssim_c2));
199 for (i = 0; i <
width; i++)
200 ssim +=
ssim_end1x(sum0[i][0] + sum0[i + 1][0] + sum1[i][0] + sum1[i + 1][0],
201 sum0[i][1] + sum0[i + 1][1] + sum1[i][1] + sum1[i + 1][1],
202 sum0[i][2] + sum0[i + 1][2] + sum1[i][2] + sum1[i + 1][2],
203 sum0[i][3] + sum0[i + 1][3] + sum1[i][3] + sum1[i + 1][3],
213 for (i = 0; i <
width; i++)
214 ssim +=
ssim_end1(sum0[i][0] + sum0[i + 1][0] + sum1[i][0] + sum1[i + 1][0],
215 sum0[i][1] + sum0[i + 1][1] + sum1[i][1] + sum1[i + 1][1],
216 sum0[i][2] + sum0[i + 1][2] + sum1[i][2] + sum1[i + 1][2],
217 sum0[i][3] + sum0[i + 1][3] + sum1[i][3] + sum1[i + 1][3]);
221 #define SUM_LEN(w) (((w) >> 2) + 3) 226 int main_linesize[4];
238 int jobnr,
int nb_jobs)
252 const int slice_start = ((height >> 2) * jobnr) / nb_jobs;
253 const int slice_end = ((height >> 2) * (jobnr+1)) / nb_jobs;
254 const int ystart =
FFMAX(1, slice_start);
257 int64_t (*sum0)[4] =
temp;
258 int64_t (*sum1)[4] = sum0 +
SUM_LEN(width);
263 for (
int y = ystart; y <
slice_end; y++) {
264 for (; z <= y; z++) {
265 FFSWAP(
void*, sum0, sum1);
267 &ref_data[4 * z * ref_stride], ref_stride,
271 ssim +=
ssim_endn_16bit((
const int64_t (*)[4])sum0, (
const int64_t (*)[4])sum1, width - 1, max);
281 int jobnr,
int nb_jobs)
295 const int slice_start = ((height >> 2) * jobnr) / nb_jobs;
296 const int slice_end = ((height >> 2) * (jobnr+1)) / nb_jobs;
297 const int ystart =
FFMAX(1, slice_start);
306 for (
int y = ystart; y <
slice_end; y++) {
307 for (; z <= y; z++) {
308 FFSWAP(
void*, sum0, sum1);
309 dsp->
ssim_4x4_line(&main_data[4 * z * main_stride], main_stride,
310 &ref_data[4 * z * ref_stride], ref_stride,
314 ssim += dsp->
ssim_end_line((
const int (*)[4])sum0, (
const int (*)[4])sum1, width - 1);
325 return (
fabs(weight - ssim) > 1e-9) ? 10.0 * log10(weight / (weight - ssim)) :
INFINITY;
334 double c[4] = {0}, ssimv = 0.0;
366 c[i] += s->
score[j][i];
381 set_meta(metadata,
"lavfi.ssim.All", 0, ssimv);
432 #define PF(suf) AV_PIX_FMT_YUV420##suf, AV_PIX_FMT_YUV422##suf, AV_PIX_FMT_YUV444##suf, AV_PIX_FMT_GBR##suf 518 outlink->
w = mainlink->
w;
519 outlink->
h = mainlink->
h;
531 av_log(ctx,
AV_LOG_WARNING,
"not matching timebases found between first input: %d/%d and second input %d/%d, results may be incorrect!\n",
599 .preinit = ssim_framesync_preinit,
605 .priv_class = &ssim_class,
const uint8_t * ref_data[4]
const AVPixFmtDescriptor * av_pix_fmt_desc_get(enum AVPixelFormat pix_fmt)
This structure describes decoded (raw) audio or video data.
static av_cold void uninit(AVFilterContext *ctx)
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
#define AV_LOG_WARNING
Something somehow does not look correct.
Main libavfilter public API header.
static int ssim_plane_16bit(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
int h
agreed upon image height
static double ssim_endn_8bit(const int(*sum0)[4], const int(*sum1)[4], int width)
The reader does not expect b to be semantically -5 here, and if the code is changed by maybe adding a cast, a division or other, the signedness will almost certainly be mistaken. To avoid this confusion a new type was introduced: SUINT is the C unsigned type but it holds a signed int. To use the same example: SUINT a
int ff_framesync_configure(FFFrameSync *fs)
Configure a frame sync structure.
static void ssim_4x4xn_8bit(const uint8_t *main, ptrdiff_t main_stride, const uint8_t *ref, ptrdiff_t ref_stride, int(*sums)[4], int width)
int is_disabled
the enabled state from the last expression evaluation
uint8_t log2_chroma_w
Amount to shift the luma width right to find the chroma width.
void * av_calloc(size_t nmemb, size_t size)
Non-inlined equivalent of av_mallocz_array().
#define AV_PIX_FMT_GRAY10
const char * name
Pad name.
AVFilterContext * parent
Parent filter context.
#define AV_PIX_FMT_GRAY12
FRAMESYNC_DEFINE_CLASS(ssim, SSIMContext, fs)
AVFilterLink ** inputs
array of pointers to input links
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
int(* ssim_plane)(AVFilterContext *ctx, void *arg, int jobnr, int nb_jobs)
static av_cold int init(AVFilterContext *ctx)
double(* ssim_end_line)(const int(*sum0)[4], const int(*sum1)[4], int w)
AVComponentDescriptor comp[4]
Parameters that describe how pixels are packed.
int ff_framesync_init_dualinput(FFFrameSync *fs, AVFilterContext *parent)
Initialize a frame sync structure for dualinput.
static const AVFilterPad ssim_inputs[]
Undefined Behavior: In the C language, some operations are undefined, like signed integer overflow, dereferencing freed pointers, accessing outside allocated space, ... Undefined Behavior must not occur in a C program; it is not safe even if the output of undefined operations is unused. The unsafety may seem nit picking, but optimizing compilers have in fact optimized code on the assumption that no undefined behavior occurs. Optimizing code based on wrong assumptions can and has in some cases led to effects beyond the output of computations. The signed integer overflow problem in speed critical code: Code which is highly optimized and works with signed integers sometimes has the problem that often the output of the computation does not c
int ff_framesync_dualinput_get(FFFrameSync *fs, AVFrame **f0, AVFrame **f1)
GLsizei GLboolean const GLfloat * value
static void ssim_4x4xn_16bit(const uint8_t *main8, ptrdiff_t main_stride, const uint8_t *ref8, ptrdiff_t ref_stride, int64_t(*sums)[4], int width)
planar YUV 4:4:0 full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV440P and setting color_range...
planar YUV 4:2:2, 16bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV422P and setting col...
AVDictionary * metadata
metadata.
static float ssim_end1(int s1, int s2, int ss, int s12)
A filter pad used for either input or output.
A link between two filters.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
uint8_t log2_chroma_h
Amount to shift the luma height right to find the chroma height.
void ff_framesync_uninit(FFFrameSync *fs)
Free all memory currently allocated.
AVRational frame_rate
Frame rate of the stream on the link, or 1/0 if unknown or variable; if left to 0/0, will be automatically copied from the first input of the source filter if it exists.
static __device__ float fabs(float a)
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
void ff_ssim_init_x86(SSIMDSPContext *dsp)
void * priv
private data for use by the filter
#define AVFILTER_FLAG_SLICE_THREADS
The filter supports multithreading by splitting frames into multiple parts and processing them concur...
AVRational time_base
Define the time base used by the PTS of the frames/samples which will pass through this link...
int ff_framesync_activate(FFFrameSync *fs)
Examine the frames in the filter's input and try to produce output.
int(* on_event)(struct FFFrameSync *fs)
Callback called when a frame event is ready.
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
int w
agreed upon image width
#define ss(width, name, subs,...)
uint8_t nb_components
The number of components each pixel has, (1-4)
int ff_filter_get_nb_threads(AVFilterContext *ctx)
Get number of threads for current filter instance.
#define AV_PIX_FMT_GRAY16
planar YUV 4:2:0, 12bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV420P and setting col...
AVRational time_base
Time base for the output events.
AVFilterContext * src
source filter
int main(int argc, char *argv[])
static const AVFilterPad outputs[]
int format
agreed upon media format
int ff_fill_rgba_map(uint8_t *rgba_map, enum AVPixelFormat pix_fmt)
static void comp(unsigned char *dst, ptrdiff_t dst_stride, unsigned char *src, ptrdiff_t src_stride, int add)
static const AVOption ssim_options[]
static const uint8_t vars[2][12]
#define AV_LOG_INFO
Standard information.
Used for passing data between threads.
int linesize[AV_NUM_DATA_POINTERS]
For video, size in bytes of each picture line.
Descriptor that unambiguously describes how the bits of a pixel are stored in the up to 4 data planes...
#define AV_PIX_FMT_GRAY14
these buffered frames must be flushed immediately if a new input produces new output. The filter must not call request_frame to get more. It must just process the frame or queue it. The task of requesting more frames is left to the filter's request_frame method or the application. If a filter has several inputs
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
planar YUV 4:1:0, 9bpp, (1 Cr & Cb sample per 4x4 Y samples)
static int config_input_ref(AVFilterLink *inlink)
Describe the class of an AVClass context structure.
size_t av_strlcatf(char *dst, size_t size, const char *fmt,...)
const char * name
Filter name.
AVRational sample_aspect_ratio
agreed upon sample aspect ratio
#define AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL
Same as AVFILTER_FLAG_SUPPORT_TIMELINE_GENERIC, except that the filter will have its filter_frame() c...
AVFilterLink ** outputs
array of pointers to output links
static int weight(int i, int blen, int offset)
static enum AVPixelFormat pix_fmts[]
#define flags(name, subs,...)
AVFilterInternal * internal
An opaque struct for libavfilter internal use.
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
int av_strerror(int errnum, char *errbuf, size_t errbuf_size)
Put a description of the AVERROR code errnum in errbuf.
static double ssim_db(double ssim, double weight)
The exact code depends on how similar the /* use it */ blocks are and how related they are to the /* finish */ block, and needs to apply these operations to the correct inlink or outlink if there are several. Macros are available to factor that when no extra processing is needed: inlink
static int av_cmp_q(AVRational a, AVRational b)
Compare two rationals.
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
static int activate(AVFilterContext *ctx)
static int ref[MAX_W *MAX_W]
planar YUV 4:4:4, 24bpp, full scale (JPEG), deprecated in favor of AV_PIX_FMT_YUV444P and setting col...
static int config_output(AVFilterLink *outlink)
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples)
avfilter_execute_func * execute
static int slice_end(AVCodecContext *avctx, AVFrame *pict)
Handle slice ends.
static float ssim_endn_16bit(const int64_t(*sum0)[4], const int64_t(*sum1)[4], int width, int max)
static float ssim_end1x(int64_t s1, int64_t s2, int64_t ss, int64_t s12, int max)
static const AVFilterPad ssim_outputs[]
void(* ssim_4x4_line)(const uint8_t *buf, ptrdiff_t buf_stride, const uint8_t *ref, ptrdiff_t ref_stride, int(*sums)[4], int w)
AVFilterContext * dst
dest filter
planar YUV 4:1:1, 12bpp, (1 Cr & Cb sample per 4x1 Y samples) full scale (JPEG), deprecated in favor ...
static int query_formats(AVFilterContext *ctx)
const uint8_t * main_data[4]
planar YUV 4:4:0 (1 Cr & Cb sample per 1x2 Y samples)
#define FFSWAP(type, a, b)
Filter design: in this document, the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: for each input and each output, the list of supported formats. For video that means pixel format. For audio that means channel layout, sample format and sample rate. The lists are not just lists, they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
int depth
Number of bits in the component.
static int do_ssim(FFFrameSync *fs)
static void set_meta(AVDictionary **metadata, const char *key, char comp, float d)
AVPixelFormat
Pixel format.
void * av_mallocz_array(size_t nmemb, size_t size)
#define AV_CEIL_RSHIFT(a, b)