doxygen/3.1/af__silencedetect_8c_source.html

 /*

  * Copyright (c) 2012 Clément Bœsch <u pkh me>

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 /**

  * @file

  * Audio silence detector

  */


 #include <float.h> /* DBL_MAX */


 #include "libavutil/opt.h"

 #include "libavutil/timestamp.h"

 #include "audio.h"

 #include "formats.h"

 #include "avfilter.h"

 #include "internal.h"


 /**
  * Private state of one silencedetect filter instance.
  *
  * The structure is used as the logging context for av_log() and is the
  * target of the option offsets in silencedetect_options[].
  */
 typedef struct SilenceDetectContext {

     const AVClass *class;       ///< class handle used for options and logging

     double noise;               ///< noise tolerance from the "n"/"noise" option; config_input() multiplies it by INT32_MAX/INT16_MAX for the S32/S16 formats

     double duration;            ///< minimum duration of silence, in seconds, until notification

     int64_t nb_null_samples;    ///< running count of consecutive samples strictly inside (-noise, noise); counted over all channels of data[0], reset by any louder sample

     int64_t start;              ///< timestamp (link time_base units) at which the current silence began; 0 means no silence is currently reported

     int last_sample_rate;       ///< sample rate seen on the previous frame, used to rescale nb_null_samples when the rate changes


     /** Per-sample-format scanner selected in config_input(); calls update() once per sample. */
     void (*silencedetect)(struct SilenceDetectContext *s, AVFrame *insamples,

                           int nb_samples, int64_t nb_samples_notify,

                           AVRational time_base);

 } SilenceDetectContext;


 /* Byte offset of an option's backing field inside the private context. */
 #define OFFSET(x) offsetof(SilenceDetectContext, x)
 /* Parenthesized so the OR-ed flags always expand as a single operand. */
 #define FLAGS (AV_OPT_FLAG_FILTERING_PARAM | AV_OPT_FLAG_AUDIO_PARAM)

 /**
  * User-settable options.
  *
  * "n"/"noise" and "d"/"duration" are short/long aliases that write to the
  * same field.  The noise tolerance defaults to 0.001 and the minimum
  * duration to 2 seconds (upper bound: 24 hours).
  */
 static const AVOption silencedetect_options[] = {
     { "n",         "set noise tolerance",              OFFSET(noise),     AV_OPT_TYPE_DOUBLE, {.dbl=0.001},          0, DBL_MAX,  FLAGS },
     { "noise",     "set noise tolerance",              OFFSET(noise),     AV_OPT_TYPE_DOUBLE, {.dbl=0.001},          0, DBL_MAX,  FLAGS },
     { "d",         "set minimum duration in seconds",  OFFSET(duration),  AV_OPT_TYPE_DOUBLE, {.dbl=2.},             0, 24*60*60, FLAGS },
     { "duration",  "set minimum duration in seconds",  OFFSET(duration),  AV_OPT_TYPE_DOUBLE, {.dbl=2.},             0, 24*60*60, FLAGS },
     { NULL }
 };

 AVFILTER_DEFINE_CLASS(silencedetect);


 /**
  * Fetch the value stored under a metadata key of a frame.
  *
  * @param insamples frame whose metadata dictionary is searched
  * @param key       key to look up
  * @return the entry's value string, or NULL when no entry matches (or the
  *         matching entry carries no value)
  */
 static char *get_metadata_val(AVFrame *insamples, const char *key)
 {
     AVDictionaryEntry *entry = av_dict_get(insamples->metadata, key, NULL, 0);

     if (!entry)
         return NULL;
     return entry->value;
 }


 /**
  * Advance the silence state machine by one sample.
  *
  * While no silence is being reported, consecutive silent samples are counted;
  * once the count reaches nb_samples_notify the start timestamp is computed
  * (frame pts minus the configured duration), stored in the frame metadata as
  * "lavfi.silence_start" and logged.  The first non-silent sample after that
  * stores "lavfi.silence_end" / "lavfi.silence_duration", logs them, and
  * resets the state.
  *
  * NOTE(review): s->start == 0 doubles as the "no silence in progress" marker,
  * so a computed start timestamp of exactly 0 cannot be told apart from it.
  *
  * @param s                 filter state
  * @param insamples         frame the sample belongs to; its pts and metadata are used
  * @param is_silence        non-zero if the current sample is below the noise threshold
  * @param nb_samples_notify number of consecutive silent samples that triggers a report
  * @param time_base         time base of insamples->pts
  */
 static av_always_inline void update(SilenceDetectContext *s, AVFrame *insamples,
                                     int is_silence, int64_t nb_samples_notify,
                                     AVRational time_base)
 {
     if (!is_silence) {
         /* A loud sample ends any silence that has already been reported. */
         if (s->start) {
             av_dict_set(&insamples->metadata, "lavfi.silence_end",
                         av_ts2timestr(insamples->pts, &time_base), 0);
             av_dict_set(&insamples->metadata, "lavfi.silence_duration",
                         av_ts2timestr(insamples->pts - s->start, &time_base), 0);
             av_log(s, AV_LOG_INFO,
                    "silence_end: %s | silence_duration: %s\n",
                    get_metadata_val(insamples, "lavfi.silence_end"),
                    get_metadata_val(insamples, "lavfi.silence_duration"));
         }
         s->start           = 0;
         s->nb_null_samples = 0;
         return;
     }

     /* Silence already reported: nothing more to do until it ends. */
     if (s->start)
         return;

     s->nb_null_samples += 1;
     if (s->nb_null_samples < nb_samples_notify)
         return;

     /* Threshold reached: back-date the start by the configured duration. */
     s->start = insamples->pts - (int64_t)(s->duration / av_q2d(time_base) + .5);
     av_dict_set(&insamples->metadata, "lavfi.silence_start",
                 av_ts2timestr(s->start, &time_base), 0);
     av_log(s, AV_LOG_INFO, "silence_start: %s\n",
            get_metadata_val(insamples, "lavfi.silence_start"));
 }


 #define SILENCE_DETECT(name, type)                                               \

 static void silencedetect_##name(SilenceDetectContext *s, AVFrame *insamples,    \

                                  int nb_samples, int64_t nb_samples_notify,      \

                                  AVRational time_base)                           \

 {                                                                                \

     const type *p = (const type *)insamples->data[0];                            \

     const type noise = s->noise;                                                 \

     int i;                                                                       \

                                                                                  \

     for (i = 0; i < nb_samples; i++, p++)                                        \

         update(s, insamples, *p < noise && *p > -noise,                          \

                nb_samples_notify, time_base);                                    \

 }


 SILENCE_DETECT(dbl, double)

 SILENCE_DETECT(flt, float)

 SILENCE_DETECT(s32, int32_t)

 SILENCE_DETECT(s16, int16_t)


 /**
  * Input pad configuration callback: select the scanner matching the
  * negotiated sample format.
  *
  * For the integer formats the noise tolerance is scaled from a ratio to the
  * sample range (INT32_MAX / INT16_MAX).
  *
  * NOTE(review): the scaling is applied to s->noise in place, so it would
  * compound if this callback ran more than once on the same instance —
  * confirm whether the framework can reconfigure an input link.
  *
  * @param inlink input link being configured
  * @return 0 on success, AVERROR_BUG if the link carries a format this filter
  *         has no scanner for
  */
 static int config_input(AVFilterLink *inlink)
 {
     AVFilterContext *ctx = inlink->dst;
     SilenceDetectContext *s = ctx->priv;

     switch (inlink->format) {
     case AV_SAMPLE_FMT_DBL: s->silencedetect = silencedetect_dbl; break;
     case AV_SAMPLE_FMT_FLT: s->silencedetect = silencedetect_flt; break;
     case AV_SAMPLE_FMT_S32:
         s->noise *= INT32_MAX;
         s->silencedetect = silencedetect_s32;
         break;
     case AV_SAMPLE_FMT_S16:
         s->noise *= INT16_MAX;
         s->silencedetect = silencedetect_s16;
         break;
     default:
         /* query_formats() only offers the four formats above; fail here
          * rather than leave s->silencedetect NULL for filter_frame(). */
         return AVERROR_BUG;
     }

     return 0;
 }


 /**
  * Scan one input frame for silence and pass it on unchanged (apart from any
  * metadata entries added by update()).
  *
  * @param inlink    input link the frame arrived on
  * @param insamples audio frame to analyse
  * @return the result of ff_filter_frame() on the first output link
  */
 static int filter_frame(AVFilterLink *inlink, AVFrame *insamples)
 {
     AVFilterContext *ctx       = inlink->dst;
     SilenceDetectContext *s    = ctx->priv;
     const int channels         = inlink->channels;
     const int rate             = inlink->sample_rate;
     /* Samples are counted across all channels. */
     const int total_samples    = insamples->nb_samples * channels;
     const int64_t notify_after = rate * s->duration * channels;
     const int rate_changed     = s->last_sample_rate &&
                                  s->last_sample_rate != rate;

     /* Rescale the running silent-sample count to the new sample rate. */
     if (rate_changed)
         s->nb_null_samples = rate * s->nb_null_samples / s->last_sample_rate;
     s->last_sample_rate = rate;

     /* TODO: document the metadata keys written by the scanner. */
     s->silencedetect(s, insamples, total_samples, notify_after,
                      inlink->time_base);

     return ff_filter_frame(ctx->outputs[0], insamples);
 }


 /**
  * Format negotiation callback.
  *
  * Requests, in this order: every channel layout, the four sample formats the
  * scanners support (DBL, FLT, S32, S16), and every sample rate.
  *
  * @param ctx filter instance
  * @return a non-negative value on success, AVERROR(ENOMEM) if a list cannot
  *         be allocated, or the negative error returned by an
  *         ff_set_common_*() helper
  */
 static int query_formats(AVFilterContext *ctx)
 {
     static const enum AVSampleFormat supported_fmts[] = {
         AV_SAMPLE_FMT_DBL,
         AV_SAMPLE_FMT_FLT,
         AV_SAMPLE_FMT_S32,
         AV_SAMPLE_FMT_S16,
         AV_SAMPLE_FMT_NONE
     };
     AVFilterChannelLayouts *all_layouts;
     AVFilterFormats *fmt_list;
     AVFilterFormats *rate_list;
     int err;

     if (!(all_layouts = ff_all_channel_layouts()))
         return AVERROR(ENOMEM);
     if ((err = ff_set_common_channel_layouts(ctx, all_layouts)) < 0)
         return err;

     if (!(fmt_list = ff_make_format_list(supported_fmts)))
         return AVERROR(ENOMEM);
     if ((err = ff_set_common_formats(ctx, fmt_list)) < 0)
         return err;

     if (!(rate_list = ff_all_samplerates()))
         return AVERROR(ENOMEM);
     return ff_set_common_samplerates(ctx, rate_list);
 }


 /**
  * Input pads: a single audio pad.  config_input() runs when the link is
  * configured and filter_frame() receives each incoming frame.
  */
 static const AVFilterPad silencedetect_inputs[] = {

     {

         .name         = "default",

         .type         = AVMEDIA_TYPE_AUDIO,

         .config_props = config_input,

         .filter_frame = filter_frame,

     },

     { NULL } /* list terminator */

 };


 /**
  * Output pads: a single audio pad with no callbacks of its own;
  * filter_frame() forwards each input frame to it.
  */
 static const AVFilterPad silencedetect_outputs[] = {

     {

         .name = "default",

         .type = AVMEDIA_TYPE_AUDIO,

     },

     { NULL } /* list terminator */

 };


 /**
  * Filter definition for "silencedetect": ties together the private context
  * size, the option class, format negotiation and the pad tables declared
  * above.
  */
 AVFilter ff_af_silencedetect = {

     .name          = "silencedetect",

     .description   = NULL_IF_CONFIG_SMALL("Detect silence."),

     .priv_size     = sizeof(SilenceDetectContext),

     .query_formats = query_formats,

     .inputs        = silencedetect_inputs,

     .outputs       = silencedetect_outputs,

     .priv_class    = &silencedetect_class,

 };

NULL
#define NULL
Definition: coverity.c:32

ff_set_common_channel_layouts
int ff_set_common_channel_layouts(AVFilterContext *ctx, AVFilterChannelLayouts *layouts)
A helper for query_formats() which sets all links to the same list of channel layouts/sample rates.
Definition: formats.c:549

s
const char * s
Definition: avisynth_c.h:631

audio.h

AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:184

AVDictionaryEntry
Definition: dict.h:85

noise
static int noise(AVBSFContext *ctx, AVPacket *out)
Definition: noise_bsf.c:37

AVOption
AVOption.
Definition: opt.h:245

avfilter.h
Main libavfilter public API header.

AV_SAMPLE_FMT_NONE
Definition: samplefmt.h:59

formats
static enum AVSampleFormat formats[]
Definition: avresample.c:163

AV_SAMPLE_FMT_FLT
float
Definition: samplefmt.h:63

SILENCE_DETECT
#define SILENCE_DETECT(name, type)
Definition: af_silencedetect.c:96

ff_af_silencedetect
AVFilter ff_af_silencedetect
Definition: af_silencedetect.c:207

ff_make_format_list
AVFilterFormats * ff_make_format_list(const int *fmts)
Create a list of supported formats.
Definition: formats.c:283

AVFilterPad::name
const char * name
Pad name.
Definition: internal.h:59

filter_frame
static int filter_frame(AVFilterLink *inlink, AVFrame *insamples)
Definition: af_silencedetect.c:136

ff_filter_frame
int ff_filter_frame(AVFilterLink *link, AVFrame *frame)
Send a frame of data to the next filter.
Definition: avfilter.c:1180

opt.h
AVOptions.

timestamp.h
timestamp utils, mostly useful for debugging/logging purposes

silencedetect_inputs
static const AVFilterPad silencedetect_inputs[]
Definition: af_silencedetect.c:189

SilenceDetectContext::duration
double duration
minimum duration of silence until notification
Definition: af_silencedetect.c:38

AVFrame::pts
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
Definition: frame.h:268

OFFSET
#define OFFSET(x)
Definition: af_silencedetect.c:48

duration
int64_t duration
Definition: movenc.c:63

av_q2d
static double av_q2d(AVRational a)
Convert rational to double.
Definition: rational.h:80

av_dict_get
AVDictionaryEntry * av_dict_get(const AVDictionary *m, const char *key, const AVDictionaryEntry *prev, int flags)
Get a dictionary entry with matching key.
Definition: dict.c:39

float.h

AVFrame::metadata
AVDictionary * metadata
metadata.
Definition: frame.h:471

AV_SAMPLE_FMT_S32
signed 32 bits
Definition: samplefmt.h:62

av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28

AVFilterPad
A filter pad used for either input or output.
Definition: internal.h:53

get_metadata_val
static char * get_metadata_val(AVFrame *insamples, const char *key)
Definition: af_silencedetect.c:60

AVFilterLink
A link between two filters.
Definition: avfilter.h:371

ff_set_common_formats
int ff_set_common_formats(AVFilterContext *ctx, AVFilterFormats *formats)
A helper for query_formats() which sets all links to the same list of formats.
Definition: formats.c:568

AVFilterLink::sample_rate
int sample_rate
samples per second
Definition: avfilter.h:386

silencedetect_outputs
static const AVFilterPad silencedetect_outputs[]
Definition: af_silencedetect.c:199

AVERROR
#define AVERROR(e)
Definition: error.h:43

FLAGS
#define FLAGS
Definition: af_silencedetect.c:49

av_ts2timestr
#define av_ts2timestr(ts, tb)
Convenience macro, the return value should be used only directly in function arguments but never stand-alone.
Definition: timestamp.h:76

NULL_IF_CONFIG_SMALL
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification.
Definition: internal.h:176

AVFilterContext::priv
void * priv
private data for use by the filter
Definition: avfilter.h:320

AVMEDIA_TYPE_AUDIO
Definition: avutil.h:194

AVFilterLink::time_base
AVRational time_base
Define the time base used by the PTS of the frames/samples which will pass through this link.
Definition: avfilter.h:397

SilenceDetectContext::start
int64_t start
if silence is detected, this value contains the time of the first zero sample
Definition: af_silencedetect.c:40

update
static av_always_inline void update(SilenceDetectContext *s, AVFrame *insamples, int is_silence, int64_t nb_samples_notify, AVRational time_base)
Definition: af_silencedetect.c:66

SilenceDetectContext::noise
double noise
noise amplitude ratio
Definition: af_silencedetect.c:37

void
typedef void(APIENTRY *FF_PFNGLACTIVETEXTUREPROC)(GLenum texture)

config_input
static int config_input(AVFilterLink *inlink)
Definition: af_silencedetect.c:115

int32_t
int32_t
Definition: audio_convert.c:194

ctx
AVFormatContext * ctx
Definition: movenc.c:48

AV_SAMPLE_FMT_DBL
double
Definition: samplefmt.h:64

outputs
static const AVFilterPad outputs[]
Definition: af_afftfilt.c:386

ff_all_channel_layouts
AVFilterChannelLayouts * ff_all_channel_layouts(void)
Construct an empty AVFilterChannelLayouts/AVFilterFormats struct – representing any channel layout (with known disposition)/sample rate.
Definition: formats.c:401

AVFilterChannelLayouts
A list of supported channel layouts.
Definition: formats.h:85

AV_LOG_INFO
#define AV_LOG_INFO
Standard information.
Definition: log.h:187

inputs
static const AVFilterPad inputs[]
Definition: af_afftfilt.c:376

AV_OPT_TYPE_DOUBLE
Definition: opt.h:225

AVSampleFormat
AVSampleFormat
Audio sample formats.
Definition: samplefmt.h:58

av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:69

AVFILTER_DEFINE_CLASS
AVFILTER_DEFINE_CLASS(silencedetect)

AVClass
Describe the class of an AVClass context structure.
Definition: log.h:67

AVFilter
Filter definition.
Definition: avfilter.h:142

AVRational
rational number numerator/denominator
Definition: rational.h:43

query_formats
static int query_formats(AVFilterContext *ctx)
Definition: af_silencedetect.c:156

AVFilter::name
const char * name
Filter name.
Definition: avfilter.h:146

AVFilterContext::outputs
AVFilterLink ** outputs
array of pointers to output links
Definition: avfilter.h:317

layouts
enum MovChannelLayoutTag * layouts
Definition: mov_chan.c:434

SilenceDetectContext
Definition: af_silencedetect.c:35

ff_all_samplerates
AVFilterFormats * ff_all_samplerates(void)
Definition: formats.c:395

SilenceDetectContext::silencedetect
void(* silencedetect)(struct SilenceDetectContext *s, AVFrame *insamples, int nb_samples, int64_t nb_samples_notify, AVRational time_base)
Definition: af_silencedetect.c:43

AV_SAMPLE_FMT_S16
signed 16 bits
Definition: samplefmt.h:61

AVFilterLink::channels
int channels
Number of channels.
Definition: avfilter.h:523

SilenceDetectContext::nb_null_samples
int64_t nb_null_samples
current number of continuous zero samples
Definition: af_silencedetect.c:39

silencedetect_options
static const AVOption silencedetect_options[]
Definition: af_silencedetect.c:50

AVDictionaryEntry::value
char * value
Definition: dict.h:87

AVFilterLink::dst
AVFilterContext * dst
dest filter
Definition: avfilter.h:375

AVFilterFormats
A list of supported formats for one end of a filter link.
Definition: formats.h:64

formats.h

AVFilterContext
An instance of a filter.
Definition: avfilter.h:305

sample_fmts
static enum AVSampleFormat sample_fmts[]
Definition: adpcmenc.c:701

av_always_inline
#define av_always_inline
Definition: attributes.h:39

nb_channels
int nb_channels
Definition: channel_layout.c:76

SilenceDetectContext::last_sample_rate
int last_sample_rate
last sample rate to check for sample rate changes
Definition: af_silencedetect.c:41

internal.h
internal API functions

AVFrame::nb_samples
int nb_samples
number of audio samples (per channel) described by this frame
Definition: frame.h:241

ff_set_common_samplerates
int ff_set_common_samplerates(AVFilterContext *ctx, AVFilterFormats *samplerates)
Definition: formats.c:556