doxygen/3.4/opusenc__psy_8c_source.html

 /*

  * Opus encoder

  * Copyright (c) 2017 Rostislav Pehlivanov <atomnuker@gmail.com>

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 #include "opusenc_psy.h"

 #include "opus_pvq.h"

 #include "opustab.h"

 #include "mdct15.h"

 #include "libavutil/qsort.h"


 /**
  * Populate the metrics of one analysis step without taking neighbouring
  * steps into consideration.
  *
  * Per channel, queued frames around the step are copied into s->scratch,
  * multiplied by the analysis window and run through the analysis MDCT.
  * The coefficients then yield, per band:
  *  - energy:     square root of the summed squared coefficients
  *  - tone:       square root of the summed squared deviation of every
  *                squared coefficient from the band's mean squared value
  *  - stereo:     square root of the summed squared difference between the
  *                first two channels (only with more than one channel)
  *  - change_amp: amount by which the filtered, squared band energy exceeds
  *                the decaying excitation level kept in s->ex
  *
  * energy and tone are added onto the values already stored in the step.
  * NOTE(review): this presumably relies on the step having been zeroed
  * before it is analysed - confirm against the callers.
  *
  * @param s     psychoacoustic context
  * @param index index of the step in s->steps; also used as the position of
  *              the matching frame in s->bufqueue
  */
 static void step_collect_psy_metrics(OpusPsyContext *s, int index)
 {
     int silence = 0, ch, i, j;
     OpusPsyStep *st = s->steps[index];

     st->index = index;

     for (ch = 0; ch < s->avctx->channels; ch++) {
         const int lap_size = (1 << s->bsize_analysis);

         /* Frames queued before the analysed one */
         for (i = 1; i <= FFMIN(lap_size, index); i++) {
             const int offset = i*120;
             AVFrame *cur = ff_bufqueue_peek(s->bufqueue, index - i);
             memcpy(&s->scratch[offset], cur->extended_data[ch], cur->nb_samples*sizeof(float));
         }

         /* The analysed frame and the ones queued after it */
         for (i = 0; i < lap_size; i++) {
             const int offset = i*120 + lap_size;
             AVFrame *cur = ff_bufqueue_peek(s->bufqueue, index + i);
             memcpy(&s->scratch[offset], cur->extended_data[ch], cur->nb_samples*sizeof(float));
         }

         /* Window in place, then transform into the step's coefficients */
         s->dsp->vector_fmul(s->scratch, s->scratch, s->window[s->bsize_analysis],
                             (OPUS_BLOCK_SIZE(s->bsize_analysis) << 1));

         s->mdct[s->bsize_analysis]->mdct(s->mdct[s->bsize_analysis], st->coeffs[ch], s->scratch, 1);

         /* Per-band pointers into the coefficient array */
         for (i = 0; i < CELT_MAX_BANDS; i++)
             st->bands[ch][i] = &st->coeffs[ch][ff_celt_freq_bands[i] << s->bsize_analysis];
     }

     for (ch = 0; ch < s->avctx->channels; ch++) {
         for (i = 0; i < CELT_MAX_BANDS; i++) {
             float avg_c_s, energy = 0.0f, dist_dev = 0.0f;
             const int range = ff_celt_freq_range[i] << s->bsize_analysis;
             const float *coeffs = st->bands[ch][i];

             for (j = 0; j < range; j++)
                 energy += coeffs[j]*coeffs[j];

             st->energy[ch][i] += sqrtf(energy);
             /* Despite its name, this flag records that some band has energy */
             silence |= !!st->energy[ch][i];
             avg_c_s = energy / range;

             /* Sum the squared deviations over the whole band; a plain
              * assignment here would keep only the last coefficient. */
             for (j = 0; j < range; j++) {
                 const float c_s = coeffs[j]*coeffs[j];
                 dist_dev += (avg_c_s - c_s)*(avg_c_s - c_s);
             }

             st->tone[ch][i] += sqrtf(dist_dev);
         }
     }

     /* The step is silent only if no band of any channel had energy */
     st->silence = !silence;

     if (s->avctx->channels > 1) {
         for (i = 0; i < CELT_MAX_BANDS; i++) {
             float incompat = 0.0f;
             const float *coeffs1 = st->bands[0][i];
             const float *coeffs2 = st->bands[1][i];
             const int range = ff_celt_freq_range[i] << s->bsize_analysis;

             for (j = 0; j < range; j++)
                 incompat += (coeffs1[j] - coeffs2[j])*(coeffs1[j] - coeffs2[j]);

             st->stereo[i] = sqrtf(incompat);
         }
     }

     for (ch = 0; ch < s->avctx->channels; ch++) {
         for (i = 0; i < CELT_MAX_BANDS; i++) {
             OpusBandExcitation *ex = &s->ex[ch][i];
             /* Run the band energy through the lo, then the hi filter */
             float bp_e = bessel_filter(&s->bfilter_lo[ch][i], st->energy[ch][i]);
             bp_e = bessel_filter(&s->bfilter_hi[ch][i], bp_e);
             bp_e *= bp_e;

             /* A new peak: record the jump and restart the decay */
             if (bp_e > ex->excitation) {
                 st->change_amp[ch][i] = bp_e - ex->excitation;
                 st->total_change += st->change_amp[ch][i];
                 ex->excitation = ex->excitation_init = bp_e;
                 ex->excitation_dist = 0.0f;
             }

             /* Decay the excitation, never letting it drop below zero */
             if (ex->excitation > 0.0f) {
                 ex->excitation -= av_clipf((1/expf(ex->excitation_dist)), ex->excitation_init/20, ex->excitation_init/1.09);
                 ex->excitation = FFMAX(ex->excitation, 0.0f);
                 ex->excitation_dist += 1.0f;
             }
         }
     }
 }


 /**
  * Recursively locate the steps at which the accumulated total_change
  * crosses a target and record them in s->inflection_points.
  *
  * The range [offset_s, offset_e) is scanned from the start; the first step
  * at which the running sum exceeds tgt_change becomes a split point. The
  * part before it is searched first, then the split point is appended, then
  * the part after it is searched, each with half the target.
  *
  * @param s          psychoacoustic context
  * @param tgt_change amount of accumulated change that triggers a split
  * @param offset_s   first step of the range (inclusive)
  * @param offset_e   end of the range (exclusive)
  * @param resolution ranges of this many steps or fewer are not searched
  * @param level      recursion depth; only passed along, never read
  */
 static void search_for_change_points(OpusPsyContext *s, float tgt_change,
                                      int offset_s, int offset_e, int resolution,
                                      int level)
 {
     const float half_target = tgt_change / 2.0f;
     float accumulated = 0.0f;
     int split = offset_s;

     /* Range too short to be worth splitting */
     if (offset_e - offset_s <= resolution)
         return;

     while (split < offset_e) {
         accumulated += s->steps[split]->total_change;
         if (accumulated > tgt_change)
             break;
         split++;
     }

     /* The target was never exceeded inside this range */
     if (split == offset_e)
         return;

     search_for_change_points(s, half_target, offset_s, split, resolution, level + 1);
     s->inflection_points[s->inflection_points_count++] = split;
     search_for_change_points(s, half_target, split + 1, offset_e, resolution, level + 1);
 }


 /**
  * Try to build a packet out of the silent steps at the head of the buffer.
  *
  * The leading silent steps are counted and the count is reduced by one.
  * Block sizes are then tried from CELT_BLOCK_960 downwards, stopping before
  * CELT_BLOCK_120, and the first one whose (1 << size) steps fit into that
  * reduced count is written to s->p together with the number of frames.
  *
  * @param s psychoacoustic context
  * @return 1 if s->p.frames and s->p.framesize were set, 0 otherwise
  */
 static int flush_silent_frames(OpusPsyContext *s)
 {
     int run = 0, bsize;

     while (run < s->buffered_steps && s->steps[run]->silence)
         run++;

     run--;
     if (run < 0)
         return 0;

     for (bsize = CELT_BLOCK_960; bsize > CELT_BLOCK_120; bsize--) {
         const int steps_per_frame = 1 << bsize;

         if (steps_per_frame <= run) {
             s->p.frames    = FFMIN(run / steps_per_frame, 48 >> bsize);
             s->p.framesize = bsize;
             return 1;
         }
     }

     return 0;
 }


 /**
  * Main function which decides frame size and frames per current packet.
  *
  * Mode and bandwidth are fixed to CELT / fullband. If the first buffered
  * step is silent and flush_silent_frames() manages to form a packet, its
  * choice is kept. Otherwise a single frame is emitted whose size is derived
  * from the configured maximum delay, capped at CELT_BLOCK_960.
  *
  * @param s psychoacoustic context; the decision is written to s->p
  */
 static void psy_output_groups(OpusPsyContext *s)
 {
     int max_delay_samples = (s->options->max_delay_ms*s->avctx->sample_rate)/1000;
     int max_bsize = FFMIN(OPUS_SAMPLES_TO_BLOCK_SIZE(max_delay_samples), CELT_BLOCK_960);

     /* These don't change for now */
     s->p.bandwidth = OPUS_BANDWIDTH_FULLBAND;
     s->p.mode      = OPUS_MODE_CELT;

     /* Flush silent frames ASAP; fall back to one frame of the largest
      * permitted size when that is not possible */
     if (!s->steps[0]->silence || !flush_silent_frames(s)) {
         s->p.frames    = 1;
         s->p.framesize = max_bsize; /* already capped at CELT_BLOCK_960 */
     }
 }


 /**
  * Account for one more buffered step and, once enough are available (or
  * EOF was signalled), decide the parameters of the next packet.
  *
  * While buffering, every (1 << bsize_analysis)-th call triggers
  * step_collect_psy_metrics(). When the buffer is full or s->eof is set, the
  * change points are searched over all buffered steps, the packet layout is
  * chosen and copied into p.
  *
  * @param s psychoacoustic context
  * @param p receives frames, framesize, mode and bandwidth when 0 is returned
  * @return 1 while the buffer is still being filled, 0 once p has been set
  */
 int ff_opus_psy_process(OpusPsyContext *s, OpusPacketInfo *p)
 {
     const int still_buffering = s->buffered_steps < s->max_steps && !s->eof;
     float change_sum = 0.0f;
     int step;

     if (still_buffering) {
         const int analysis_steps = 1 << s->bsize_analysis;

         s->steps_to_process++;
         if (s->steps_to_process >= analysis_steps) {
             step_collect_psy_metrics(s, s->buffered_steps - analysis_steps + 1);
             s->steps_to_process = 0;
         }

         s->buffered_steps++;
         if (s->buffered_steps < s->max_steps)
             return 1;
     }

     for (step = 0; step < s->buffered_steps; step++)
         change_sum += s->steps[step]->total_change;

     /* The initial target is half of the total change in the buffer */
     search_for_change_points(s, change_sum / 2.0f, 0,
                              s->buffered_steps, 1, 0);

     psy_output_groups(s);

     p->mode      = s->p.mode;
     p->bandwidth = s->p.bandwidth;
     p->framesize = s->p.framesize;
     p->frames    = s->p.frames;

     return 0;
 }


 /**
  * Initialise a CELT frame from the current packet decision.
  *
  * Sets the band range, channel count and size, and flags the frame silent
  * when every step it covers is silent. Silent frames get framebits = 0 and
  * nothing else is initialised. Otherwise the frame is flagged transient if
  * at least one inflection point lies within the steps it covers, and the
  * remaining coding parameters are set to defaults.
  *
  * @param s     psychoacoustic context (s->p must already be decided)
  * @param f     frame to initialise
  * @param index index of the frame within the packet
  */
 void ff_opus_psy_celt_frame_init(OpusPsyContext *s, CeltFrame *f, int index)
 {
     int i, neighbouring_points = 0;
     int radius = (1 << s->p.framesize), step_offset = radius*index;
     int silence = 1;

     f->start_band = (s->p.mode == OPUS_MODE_HYBRID) ? 17 : 0;
     f->end_band   = ff_celt_band_end[s->p.bandwidth];
     f->channels   = s->avctx->channels;
     f->size       = s->p.framesize;

     for (i = 0; i < (1 << f->size); i++)
         silence &= s->steps[index*(1 << f->size) + i]->silence;

     f->silence = silence;
     if (f->silence) {
         f->framebits = 0; /* Otherwise the silence flag eats up 16(!) bits */
         return;
     }

     /* Count the inflection points that fall inside the steps covered by
      * this frame, i.e. in [step_offset, step_offset + radius). Each entry is
      * tested against both ends of the range, so points belonging to earlier
      * or later frames are never counted. */
     for (i = 0; i < s->inflection_points_count; i++) {
         const int point = s->inflection_points[i];
         if (point >= step_offset && point < (step_offset + radius))
             neighbouring_points++;
     }

     /* Transient flagging */
     f->transient = neighbouring_points > 0;
     f->blocks = f->transient ? OPUS_BLOCK_SIZE(s->p.framesize)/CELT_OVERLAP : 1;

     /* Some sane defaults */
     f->pfilter   = 0;
     f->pf_gain   = 0.5f;
     f->pf_octave = 2;
     f->pf_period = 1;
     f->pf_tapset = 2;

     /* More sane defaults */
     f->tf_select = 0;
     f->anticollapse = 1;
     f->alloc_trim = 5;
     f->skip_band_floor = f->end_band;
     f->intensity_stereo = f->end_band;
     f->dual_stereo = 0;
     f->spread = CELT_SPREAD_NORMAL;
     memset(f->tf_change, 0, sizeof(int)*CELT_MAX_BANDS);
     memset(f->alloc_boost, 0, sizeof(int)*CELT_MAX_BANDS);
 }


 /**
  * Derive per-band allocation boosts, the spread setting and the bit budget
  * of a frame from the metrics of the steps it covers.
  *
  * @param s     psychoacoustic context
  * @param start first of the (1 << s->p.framesize) steps covered by the frame
  * @param f_out frame whose alloc_boost, spread and framebits are written
  */
 static void celt_gauge_psy_weight(OpusPsyContext *s, OpusPsyStep **start,
                                   CeltFrame *f_out)
 {
     const int nb_steps   = 1 << s->p.framesize;
     const int frame_size = OPUS_BLOCK_SIZE(s->p.framesize);
     int band, step, ch;

     /* Pseudo-weights */
     float band_score[CELT_MAX_BANDS] = { 0 };
     float max_score = 1.0f;

     /* Used for the global ROTATE flag */
     float tonal = 0.0f;

     float rate, frame_bits = 0;

     /* Pass one - one loop around each band, computing unquant stuff */
     for (band = 0; band < CELT_MAX_BANDS; band++) {
         float weight = 0.0f;
         float tonal_contrib = 0.0f;

         for (step = 0; step < nb_steps; step++) {
             const OpusPsyStep *st = start[step];

             /* NOTE(review): weight is restarted on every step, so only the
              * last step ends up in the band score - confirm this is meant */
             weight = st->stereo[band];
             for (ch = 0; ch < s->avctx->channels; ch++) {
                 weight += st->change_amp[ch][band] + st->tone[ch][band] + st->energy[ch][band];
                 tonal_contrib += st->tone[ch][band];
             }
         }

         tonal += tonal_contrib;
         band_score[band] = weight;

         /* Track the largest score; it never drops below the initial 1.0 */
         if (weight > max_score)
             max_score = weight;
     }

     /* Boost is the score relative to the maximum, scaled to 0..3 */
     for (band = 0; band < CELT_MAX_BANDS; band++) {
         f_out->alloc_boost[band] = (int)((band_score[band]/max_score)*3.0f);
         frame_bits += band_score[band]*8.0f;
     }

     /* Average tone over the bands, scaled, rounded and clipped to two
      * unsigned bits */
     tonal /= (float)CELT_MAX_BANDS;
     tonal /= 1333136.0f;
     f_out->spread = av_clip_uintp2(lrintf(tonal), 2);

     rate  = ((float)s->avctx->bit_rate) + frame_bits*frame_size*16;
     rate *= s->lambda;
     rate /= s->avctx->sample_rate/frame_size;

     /* Round, cap at the maximum packet size and align to whole bytes */
     f_out->framebits = lrintf(rate);
     f_out->framebits = FFMIN(f_out->framebits, OPUS_MAX_PACKET_SIZE*8);
     f_out->framebits = FFALIGN(f_out->framebits, 8);
 }


 /**
  * Sum the cost reported by the PVQ band_cost callback over all bands for
  * the frame's current settings.
  *
  * A scratch range coder is initialised and the bit allocation is run on it
  * before the bands are evaluated.
  *
  * @param s          psychoacoustic context (supplies lambda)
  * @param f          frame to evaluate
  * @param total_dist receives the summed cost
  * @return always 0
  */
 static int bands_dist(OpusPsyContext *s, CeltFrame *f, float *total_dist)
 {
     int i;
     /* Kept as float: band_cost() returns float, and an integer accumulator
      * would discard the fractional part of every partial sum. */
     float tdist = 0.0f;
     OpusRangeCoder dump;

     ff_opus_rc_enc_init(&dump);
     ff_celt_enc_bitalloc(&dump, f);

     for (i = 0; i < CELT_MAX_BANDS; i++) {
         float bits = 0.0f; /* output of band_cost(); not used here */
         float dist = f->pvq->band_cost(f->pvq, f, &dump, i, &bits, s->lambda);
         tdist += dist;
     }

     *total_dist = tdist;

     return 0;
 }


 /**
  * Decide whether to use dual stereo by comparing the total band cost with
  * the flag off and on; the flag is enabled only if that is strictly cheaper.
  * s->dual_stereo_used is incremented whenever dual stereo is chosen.
  *
  * @param s psychoacoustic context
  * @param f frame whose dual_stereo flag is set
  */
 static void celt_search_for_dual_stereo(OpusPsyContext *s, CeltFrame *f)
 {
     float dist_off, dist_on;
     int use_dual;

     f->dual_stereo = 0;
     bands_dist(s, f, &dist_off);

     f->dual_stereo = 1;
     bands_dist(s, f, &dist_on);

     use_dual = dist_on < dist_off;

     f->dual_stereo       = use_dual;
     s->dual_stereo_used += use_dual;
 }


 /**
  * Pick the intensity stereo start band by brute force: every band from
  * f->end_band down to 0 is tried and the one with the lowest total band
  * cost wins (the highest such band on ties, as it is tried first).
  * s->avg_is_band is then averaged with the chosen band.
  *
  * @param s psychoacoustic context
  * @param f frame whose intensity_stereo field is set
  */
 static void celt_search_for_intensity(OpusPsyContext *s, CeltFrame *f)
 {
     /* TODO: fix, make some heuristic up here using the lambda value */
     const int lowest_band = 0;

     int band = f->end_band;
     int chosen_band = CELT_MAX_BANDS - 1;
     float lowest_dist = FLT_MAX;

     while (band >= lowest_band) {
         float dist;

         f->intensity_stereo = band;
         bands_dist(s, f, &dist);

         if (dist < lowest_dist) {
             lowest_dist = dist;
             chosen_band = band;
         }

         band--;
     }

     f->intensity_stereo = chosen_band;
     s->avg_is_band = (s->avg_is_band + f->intensity_stereo)/2.0f;
 }


 /**
  * Choose tf_select and the per-band tf_change flags of a frame.
  *
  * For both tf_select candidates, each band is scored with the two
  * resolutions listed in ff_celt_tf_select. A band's score is the sum over
  * all covered steps and channels of tone * change_amp divided by the
  * resolution. tf_change is set for a band when the first score is closer
  * to 1.0 than the second. The candidate's total adds up the second score
  * for flagged bands and the first score otherwise. tf_select becomes 1
  * when candidate 0 has the smaller total.
  *
  * @param s     psychoacoustic context
  * @param start first of the (1 << f->size) steps covered by the frame
  * @param f     frame whose tf_select and tf_change are written
  * @return always 0
  */
 static int celt_search_for_tf(OpusPsyContext *s, OpusPsyStep **start, CeltFrame *f)
 {
     const int nb_steps = 1 << f->size;
     const int base     = f->transient ? 120 : 960;
     int config[2][CELT_MAX_BANDS] = { { 0 } };
     float score[2] = { 0 };
     int cway, n, band, step, ch;

     for (cway = 0; cway < 2; cway++) {
         int mag[2];

         /* Negative table entries shrink the base, others enlarge it */
         for (n = 0; n < 2; n++) {
             const int c = ff_celt_tf_select[f->size][f->transient][cway][n];
             mag[n] = c < 0 ? base >> FFABS(c) : base << FFABS(c);
         }

         for (band = 0; band < CELT_MAX_BANDS; band++) {
             float iscore0 = 0.0f;
             float iscore1 = 0.0f;

             for (step = 0; step < nb_steps; step++) {
                 const OpusPsyStep *st = start[step];

                 for (ch = 0; ch < s->avctx->channels; ch++) {
                     iscore0 += st->tone[ch][band]*st->change_amp[ch][band]/mag[0];
                     iscore1 += st->tone[ch][band]*st->change_amp[ch][band]/mag[1];
                 }
             }

             config[cway][band] = FFABS(iscore0 - 1.0f) < FFABS(iscore1 - 1.0f);
             score[cway] += config[cway][band] ? iscore1 : iscore0;
         }
     }

     f->tf_select = score[0] < score[1];
     memcpy(f->tf_change, config[f->tf_select], sizeof(int)*CELT_MAX_BANDS);

     return 0;
 }


 /**
  * Run the per-frame searches (bit budget and boosts, intensity stereo,
  * dual stereo, TF) on a non-silent frame.
  *
  * If the frame's transient flag differs from its value on entry, f->blocks
  * is recomputed and s->redo_analysis is raised.
  *
  * @param s     psychoacoustic context
  * @param f     frame to process
  * @param index index of the frame within the packet
  * @return 1 if the transient flag changed, 0 otherwise (silent frames
  *         always return 0 and leave s->redo_analysis untouched)
  */
 int ff_opus_psy_celt_frame_process(OpusPsyContext *s, CeltFrame *f, int index)
 {
     const int transient_on_entry = f->transient;
     OpusPsyStep **start = &s->steps[index * (1 << s->p.framesize)];

     if (f->silence)
         return 0;

     celt_gauge_psy_weight(s, start, f);
     celt_search_for_intensity(s, f);
     celt_search_for_dual_stereo(s, f);
     celt_search_for_tf(s, start, f);

     s->redo_analysis = (f->transient != transient_on_entry);
     if (!s->redo_analysis)
         return 0;

     f->blocks = f->transient ? OPUS_BLOCK_SIZE(s->p.framesize)/CELT_OVERLAP : 1;

     return 1;
 }


 /**
  * Update the psychoacoustic state after a packet has been encoded.
  *
  * The steps consumed by the packet are zeroed and rotated to the back of
  * s->steps, lambda is rescaled by the ratio between the ideal and the used
  * bits of every frame, the intensity stereo average is refreshed and the
  * per-packet counters are reset.
  *
  * @param s  psychoacoustic context
  * @param f  array of the s->p.frames frames that made up the packet
  * @param rc range coder; not read by this function
  */
 void ff_opus_psy_postencode_update(OpusPsyContext *s, CeltFrame *f, OpusRangeCoder *rc)
 {
     int i, frame_size = OPUS_BLOCK_SIZE(s->p.framesize);
     int steps_out = s->p.frames*(frame_size/120);
     void *tmp[FF_BUFQUEUE_SIZE];
     float ideal_fbits;

     /* Wipe the metrics of the steps that were just sent out */
     for (i = 0; i < steps_out; i++)
         memset(s->steps[i], 0, sizeof(OpusPsyStep));

     /* Rotate the step pointers left by steps_out, wrapping the consumed
      * ones around to the end */
     for (i = 0; i < s->max_steps; i++)
         tmp[i] = s->steps[i];

     for (i = 0; i < s->max_steps; i++) {
         const int i_new = i - steps_out;
         s->steps[i_new < 0 ? s->max_steps + i_new : i_new] = tmp[i];
     }

     for (i = steps_out; i < s->buffered_steps; i++)
         s->steps[i]->index -= steps_out;

     ideal_fbits = s->avctx->bit_rate/(s->avctx->sample_rate/frame_size);

     for (i = 0; i < s->p.frames; i++) {
         s->avg_is_band += f[i].intensity_stereo;
         /* Frames without a bit budget (framebits == 0, as set for silent
          * frames by ff_opus_psy_celt_frame_init()) carry no rate
          * information; dividing by zero would turn lambda into inf/NaN. */
         if (f[i].framebits > 0)
             s->lambda *= ideal_fbits / f[i].framebits;
     }

     s->avg_is_band /= (s->p.frames + 1);

     s->cs_num = 0;
     s->steps_to_process = 0;
     s->buffered_steps -= steps_out;
     s->total_packets_out += s->p.frames;
     s->inflection_points_count = 0;
 }


 /**
  * Set up a psychoacoustic context: store the references it works on and
  * allocate the inflection point list, the float DSP context, one step per
  * 2.5 ms of maximum delay, and a sine window plus MDCT per block size.
  *
  * On failure everything this function may have allocated is released.
  * NOTE(review): the cleanup frees every step/window/MDCT slot regardless of
  * how far initialisation got, so it presumably expects *s to have been
  * zero-initialised by the caller - confirm.
  *
  * @param s        context to initialise
  * @param avctx    codec context (channel count, flags)
  * @param bufqueue queue the analysis will read frames from
  * @param options  encoder options (max_delay_ms is read here)
  * @return 0 on success, AVERROR(ENOMEM) or the MDCT init error on failure
  */
 av_cold int ff_opus_psy_init(OpusPsyContext *s, AVCodecContext *avctx,
                              struct FFBufQueue *bufqueue, OpusEncOptions *options)
 {
     int ret, ch, band, step, bsize;

     s->avctx    = avctx;
     s->options  = options;
     s->bufqueue = bufqueue;

     s->lambda                  = 1.0f;
     s->redo_analysis           = 0;
     s->inflection_points_count = 0;
     s->bsize_analysis          = CELT_BLOCK_960;
     s->avg_is_band             = CELT_MAX_BANDS - 1;
     s->max_steps               = ceilf(s->options->max_delay_ms/2.5f);

     s->inflection_points = av_mallocz(sizeof(*s->inflection_points)*s->max_steps);
     if (!s->inflection_points) {
         ret = AVERROR(ENOMEM);
         goto fail;
     }

     s->dsp = avpriv_float_dsp_alloc(avctx->flags & AV_CODEC_FLAG_BITEXACT);
     if (!s->dsp) {
         ret = AVERROR(ENOMEM);
         goto fail;
     }

     /* One hi/lo filter pair per channel and band */
     for (ch = 0; ch < s->avctx->channels; ch++) {
         for (band = 0; band < CELT_MAX_BANDS; band++) {
             bessel_init(&s->bfilter_hi[ch][band], 1.0f, 19.0f, 100.0f, 1);
             bessel_init(&s->bfilter_lo[ch][band], 1.0f, 20.0f, 100.0f, 0);
         }
     }

     for (step = 0; step < s->max_steps; step++) {
         s->steps[step] = av_mallocz(sizeof(OpusPsyStep));
         if (!s->steps[step]) {
             ret = AVERROR(ENOMEM);
             goto fail;
         }
     }

     /* A window of twice the block length and an MDCT for each block size */
     for (bsize = 0; bsize < CELT_BLOCK_NB; bsize++) {
         const int win_len = 2*OPUS_BLOCK_SIZE(bsize);
         float overlap; /* written by generate_window_func(), not used */

         s->window[bsize] = av_malloc(win_len*sizeof(float));
         if (!s->window[bsize]) {
             ret = AVERROR(ENOMEM);
             goto fail;
         }
         generate_window_func(s->window[bsize], win_len, WFUNC_SINE, &overlap);

         ret = ff_mdct15_init(&s->mdct[bsize], 0, bsize + 3, 68 << (CELT_BLOCK_NB - 1 - bsize));
         if (ret)
             goto fail;
     }

     return 0;

 fail:
     av_freep(&s->inflection_points);
     av_freep(&s->dsp);

     for (bsize = 0; bsize < CELT_BLOCK_NB; bsize++) {
         ff_mdct15_uninit(&s->mdct[bsize]);
         av_freep(&s->window[bsize]);
     }

     for (step = 0; step < s->max_steps; step++)
         av_freep(&s->steps[step]);

     return ret;
 }


 /**
  * Mark the end of the input. Once the flag is set, ff_opus_psy_process()
  * no longer waits for the step buffer to fill up.
  *
  * @param s psychoacoustic context
  */
 void ff_opus_psy_signal_eof(OpusPsyContext *s)
 {
     s->eof = 1;
 }


 /**
  * Release everything owned by the psychoacoustic context and log the
  * encoding statistics (average intensity stereo band and the share of
  * packets that used dual stereo).
  *
  * @param s psychoacoustic context
  * @return always 0
  */
 av_cold int ff_opus_psy_end(OpusPsyContext *s)
 {
     int i;
     float dual_stereo_pct = 0.0f;

     av_freep(&s->inflection_points);
     av_freep(&s->dsp);

     for (i = 0; i < CELT_BLOCK_NB; i++) {
         ff_mdct15_uninit(&s->mdct[i]);
         av_freep(&s->window[i]);
     }

     for (i = 0; i < s->max_steps; i++)
         av_freep(&s->steps[i]);

     /* Without any packet the ratio is undefined; report 0% rather than
      * dividing by zero and logging nan/inf. */
     if (s->total_packets_out > 0)
         dual_stereo_pct = ((float)s->dual_stereo_used/s->total_packets_out)*100.0f;

     av_log(s->avctx, AV_LOG_INFO, "Average Intensity Stereo band: %0.1f\n", s->avg_is_band);
     av_log(s->avctx, AV_LOG_INFO, "Dual Stereo used: %0.2f%%\n", dual_stereo_pct);

     return 0;
 }

CeltFrame::channels
int channels
Definition: opus_celt.h:99

OpusEncOptions::max_delay_ms
float max_delay_ms
Definition: opusenc.h:44

OpusPsyContext::mdct
MDCT15Context * mdct[CELT_BLOCK_NB]
Definition: opusenc_psy.h:71

ff_opus_psy_celt_frame_init
void ff_opus_psy_celt_frame_init(OpusPsyContext *s, CeltFrame *f, int index)
Definition: opusenc_psy.c:204

flush_silent_frames
static int flush_silent_frames(OpusPsyContext *s)
Definition: opusenc_psy.c:134

OPUS_BANDWIDTH_FULLBAND
Definition: opus.h:75

OPUS_SAMPLES_TO_BLOCK_SIZE
#define OPUS_SAMPLES_TO_BLOCK_SIZE(x)
Definition: opusenc.h:41

OpusPsyContext::avctx
AVCodecContext * avctx
Definition: opusenc_psy.h:55

OpusPsyContext::total_packets_out
int64_t total_packets_out
Definition: opusenc_psy.h:80

CeltFrame::anticollapse
int anticollapse
Definition: opus_celt.h:116

OpusPacketInfo::bandwidth
enum OpusBandwidth bandwidth
Definition: opusenc.h:49

s
const char * s
Definition: avisynth_c.h:768

OpusPsyContext::bufqueue
struct FFBufQueue * bufqueue
Definition: opusenc_psy.h:57

OpusPsyContext::cs_num
int cs_num
Definition: opusenc_psy.h:61

AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:201

CeltFrame::framebits
int framebits
Definition: opus_celt.h:130

OpusPsyContext::window
float * window[CELT_BLOCK_NB]
Definition: opusenc_psy.h:70

ff_opus_rc_enc_init
void ff_opus_rc_enc_init(OpusRangeCoder *rc)
Definition: opus_rc.c:402

AVCodecContext::bit_rate
int64_t bit_rate
the average bitrate
Definition: avcodec.h:1826

config
static FFServerConfig config
Definition: ffserver.c:193

OpusPsyContext::steps
OpusPsyStep * steps[FF_BUFQUEUE_SIZE+1]
Definition: opusenc_psy.h:67

OpusPsyContext::bfilter_hi
FFBesselFilter bfilter_hi[OPUS_MAX_CHANNELS][CELT_MAX_BANDS]
Definition: opusenc_psy.h:65

OpusPsyContext::bfilter_lo
FFBesselFilter bfilter_lo[OPUS_MAX_CHANNELS][CELT_MAX_BANDS]
Definition: opusenc_psy.h:64

ff_celt_freq_bands
const uint8_t ff_celt_freq_bands[]
Definition: opustab.c:763

generate_window_func
static void generate_window_func(float *lut, int N, int win_func, float *overlap)
Definition: window_func.h:35

av_mallocz
void * av_mallocz(size_t size)
Allocate a memory block with alignment suitable for all memory accesses (including vectors if availab...
Definition: mem.c:222

OpusPsyContext::buffered_steps
int buffered_steps
Definition: opusenc_psy.h:86

OPUS_MAX_PACKET_SIZE
#define OPUS_MAX_PACKET_SIZE
Definition: opus_rc.h:29

OPUS_MODE_CELT
Definition: opus.h:65

CeltFrame::pf_period
int pf_period
Definition: opus_celt.h:125

ff_celt_enc_bitalloc
void ff_celt_enc_bitalloc(OpusRangeCoder *rc, CeltFrame *f)
Definition: opusenc.c:285

mdct15.h

FFBufQueue
Structure holding the queue.
Definition: bufferqueue.h:49

ff_celt_band_end
const uint8_t ff_celt_band_end[]
Definition: opustab.c:27

OpusPsyStep::coeffs
float coeffs[OPUS_MAX_CHANNELS][OPUS_BLOCK_SIZE(CELT_BLOCK_960)]
Definition: opusenc_psy.h:40

OpusBandExcitation::excitation
float excitation
Definition: opusenc_psy.h:44

OpusPacketInfo::frames
int frames
Definition: opusenc.h:51

OpusPsyContext::options
OpusEncOptions * options
Definition: opusenc_psy.h:58

CELT_SPREAD_NORMAL
Definition: opus_celt.h:52

OpusPsyStep::silence
int silence
Definition: opusenc_psy.h:32

bessel_filter
static float bessel_filter(FFBesselFilter *s, float x)
Definition: opusenc_utils.h:76

bits
uint8_t bits
Definition: crc.c:296

av_cold
#define av_cold
Definition: attributes.h:82

CELT_OVERLAP
#define CELT_OVERLAP
Definition: opus.h:42

av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31

CeltFrame::silence
int silence
Definition: opus_celt.h:114

OpusPsyContext::inflection_points
int * inflection_points
Definition: opusenc_psy.h:90

OpusBandExcitation::excitation_init
float excitation_init
Definition: opusenc_psy.h:46

OpusPsyStep::stereo
float stereo[CELT_MAX_BANDS]
Definition: opusenc_psy.h:35

ch
uint8_t pi<< 24) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_U8,(uint64_t)((*(constuint8_t *) pi-0x80U))<< 56) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8,(*(constuint8_t *) pi-0x80)*(1.0f/(1<< 7))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8,(*(constuint8_t *) pi-0x80)*(1.0/(1<< 7))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16,(*(constint16_t *) pi >>8)+0x80) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_S16,(uint64_t)(*(constint16_t *) pi)<< 48) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16,*(constint16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16,*(constint16_t *) pi *(1.0/(1<< 15))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32,(*(constint32_t *) pi >>24)+0x80) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_S32,(uint64_t)(*(constint32_t *) pi)<< 32) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32,*(constint32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32,*(constint32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S64,(*(constint64_t *) pi >>56)+0x80) CONV_FUNC(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S64,*(constint64_t *) pi *(1.0f/(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S64,*(constint64_t *) pi *(1.0/(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, av_clip_uint8(lrintf(*(constfloat *) pi *(1<< 7))+0x80)) CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, av_clip_int16(lrintf(*(constfloat *) pi *(1<< 15)))) CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, av_clipl_int32(llrintf(*(constfloat *) pi *(1U<< 31)))) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_FLT, llrintf(*(constfloat *) pi *(INT64_C(1)<< 63))) CONV_FUNC(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, av_clip_uint8(lrint(*(constdouble *) pi *(1<< 7))+0x80)) CONV_FUNC(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, av_clip_int16(lrint(*(constdouble *) pi 
*(1<< 15)))) CONV_FUNC(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, av_clipl_int32(llrint(*(constdouble *) pi *(1U<< 31)))) CONV_FUNC(AV_SAMPLE_FMT_S64, int64_t, AV_SAMPLE_FMT_DBL, llrint(*(constdouble *) pi *(INT64_C(1)<< 63)))#defineFMT_PAIR_FUNC(out, in) staticconv_func_type *constfmt_pair_to_conv_functions[AV_SAMPLE_FMT_NB *AV_SAMPLE_FMT_NB]={FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_U8), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S16), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S32), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_FLT), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_DBL), FMT_PAIR_FUNC(AV_SAMPLE_FMT_U8, AV_SAMPLE_FMT_S64), 
FMT_PAIR_FUNC(AV_SAMPLE_FMT_S16, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S32, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_FLT, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_DBL, AV_SAMPLE_FMT_S64), FMT_PAIR_FUNC(AV_SAMPLE_FMT_S64, AV_SAMPLE_FMT_S64),};staticvoidcpy1(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, len);}staticvoidcpy2(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, 2 *len);}staticvoidcpy4(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, 4 *len);}staticvoidcpy8(uint8_t **dst, constuint8_t **src, intlen){memcpy(*dst,*src, 8 *len);}AudioConvert *swri_audio_convert_alloc(enumAVSampleFormatout_fmt, enumAVSampleFormatin_fmt, intchannels, constint *ch_map, intflags){AudioConvert *ctx;conv_func_type *f=fmt_pair_to_conv_functions[av_get_packed_sample_fmt(out_fmt)+AV_SAMPLE_FMT_NB *av_get_packed_sample_fmt(in_fmt)];if(!f) returnNULL;ctx=av_mallocz(sizeof(*ctx));if(!ctx) returnNULL;if(channels==1){in_fmt=av_get_planar_sample_fmt(in_fmt);out_fmt=av_get_planar_sample_fmt(out_fmt);}ctx->channels=channels;ctx->conv_f=f;ctx->ch_map=ch_map;if(in_fmt==AV_SAMPLE_FMT_U8||in_fmt==AV_SAMPLE_FMT_U8P) memset(ctx->silence, 0x80, sizeof(ctx->silence));if(out_fmt==in_fmt &&!ch_map){switch(av_get_bytes_per_sample(in_fmt)){case1:ctx->simd_f=cpy1;break;case2:ctx->simd_f=cpy2;break;case4:ctx->simd_f=cpy4;break;case8:ctx->simd_f=cpy8;break;}}if(HAVE_X86ASM &&1) swri_audio_convert_init_x86(ctx, out_fmt, in_fmt, channels);if(ARCH_ARM) swri_audio_convert_init_arm(ctx, out_fmt, in_fmt, channels);if(ARCH_AARCH64) swri_audio_convert_init_aarch64(ctx, out_fmt, in_fmt, channels);returnctx;}voidswri_audio_convert_free(AudioConvert **ctx){av_freep(ctx);}intswri_audio_convert(AudioConvert *ctx, AudioData *out, AudioData *in, 
intlen){intch;intoff=0;constintos=(out->planar?1:out->ch_count)*out->bps;unsignedmisaligned=0;av_assert0(ctx->channels==out->ch_count);if(ctx->in_simd_align_mask){intplanes=in->planar?in->ch_count:1;unsignedm=0;for(ch=0;ch< planes;ch++) m|=(intptr_t) in->ch[ch];misaligned|=m &ctx->in_simd_align_mask;}if(ctx->out_simd_align_mask){intplanes=out->planar?out->ch_count:1;unsignedm=0;for(ch=0;ch< planes;ch++) m|=(intptr_t) out->ch[ch];misaligned|=m &ctx->out_simd_align_mask;}if(ctx->simd_f &&!ctx->ch_map &&!misaligned){off=len &~15;av_assert1(off >=0);av_assert1(off<=len);av_assert2(ctx->channels==SWR_CH_MAX||!in->ch[ctx->channels]);if(off >0){if(out->planar==in->planar){intplanes=out->planar?out->ch_count:1;for(ch=0;ch< planes;ch++){ctx->simd_f(out-> ch ch
Definition: audioconvert.c:56

ff_opus_psy_process
int ff_opus_psy_process(OpusPsyContext *s, OpusPacketInfo *p)
Definition: opusenc_psy.c:173

ff_mdct15_init
av_cold int ff_mdct15_init(MDCT15Context **ps, int inverse, int N, double scale)
Definition: mdct15.c:247

CeltFrame::dual_stereo
int dual_stereo
Definition: opus_celt.h:118

ff_opus_psy_celt_frame_process
int ff_opus_psy_celt_frame_process(OpusPsyContext *s, CeltFrame *f, int index)
Definition: opusenc_psy.c:400

OpusPacketInfo::mode
enum OpusMode mode
Definition: opusenc.h:48

lrintf
#define lrintf(x)
Definition: libm_mips.h:70

CeltFrame::skip_band_floor
int skip_band_floor
Definition: opus_celt.h:108

options
const OptionDef options[]
Definition: ffserver.c:3948

FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:48

av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28

CeltFrame::end_band
int end_band
Definition: opus_celt.h:104

CELT_BLOCK_960
Definition: opus_celt.h:60

OpusPacketInfo
Definition: opusenc.h:47

expf
#define expf(x)
Definition: libm.h:283

CeltFrame::alloc_boost
int alloc_boost[CELT_MAX_BANDS]
Definition: opus_celt.h:111

bands_dist
static int bands_dist(OpusPsyContext *s, CeltFrame *f, float *total_dist)
Definition: opusenc_psy.c:313

avpriv_float_dsp_alloc
av_cold AVFloatDSPContext * avpriv_float_dsp_alloc(int bit_exact)
Allocate a float DSP context.
Definition: float_dsp.c:127

OpusPsyContext::dsp
AVFloatDSPContext * dsp
Definition: opusenc_psy.h:56

AVFloatDSPContext::vector_fmul
void(* vector_fmul)(float *dst, const float *src0, const float *src1, int len)
Calculate the entry wise product of two vectors of floats and store the result in a vector of floats...
Definition: float_dsp.h:38

OPUS_BLOCK_SIZE
#define OPUS_BLOCK_SIZE(x)
Definition: opusenc.h:39

AVERROR
#define AVERROR(e)
Definition: error.h:43

CeltFrame::start_band
int start_band
Definition: opus_celt.h:103

WFUNC_SINE
Definition: window_func.h:30

AVCodecContext::flags
int flags
AV_CODEC_FLAG_*.
Definition: avcodec.h:1856

CELT_BLOCK_120
Definition: opus_celt.h:57

ff_opus_psy_init
av_cold int ff_opus_psy_init(OpusPsyContext *s, AVCodecContext *avctx, struct FFBufQueue *bufqueue, OpusEncOptions *options)
Definition: opusenc_psy.c:461

FF_BUFQUEUE_SIZE
#define FF_BUFQUEUE_SIZE
Definition: audiotoolboxenc.c:25

CeltFrame::tf_change
int tf_change[CELT_MAX_BANDS]
Definition: opus_celt.h:137

OpusPsyStep::total_change
float total_change
Definition: opusenc_psy.h:37

OpusPsyContext::eof
int eof
Definition: opusenc_psy.h:88

OpusPsyContext
Definition: opusenc_psy.h:54

CeltFrame::pfilter
int pfilter
Definition: opus_celt.h:107

offset
static const uint8_t offset[127][2]
Definition: vf_spp.c:92

FFMAX
#define FFMAX(a, b)
Definition: common.h:94

fail
#define fail()
Definition: checkasm.h:109

CeltFrame::pf_gain
float pf_gain
Definition: opus_celt.h:127

OpusPsyContext::redo_analysis
int redo_analysis
Definition: opusenc_psy.h:85

celt_search_for_dual_stereo
static void celt_search_for_dual_stereo(OpusPsyContext *s, CeltFrame *f)
Definition: opusenc_psy.c:332

OpusPsyStep::bands
float * bands[OPUS_MAX_CHANNELS][CELT_MAX_BANDS]
Definition: opusenc_psy.h:39

ff_celt_tf_select
const int8_t ff_celt_tf_select[4][2][2][2]
Definition: opustab.c:777

celt_gauge_psy_weight
static void celt_gauge_psy_weight(OpusPsyContext *s, OpusPsyStep **start, CeltFrame *f_out)
Definition: opusenc_psy.c:260

celt_search_for_tf
static int celt_search_for_tf(OpusPsyContext *s, OpusPsyStep **start, CeltFrame *f)
Definition: opusenc_psy.c:365

AV_CODEC_FLAG_BITEXACT
#define AV_CODEC_FLAG_BITEXACT
Use only bitexact stuff (except (I)DCT).
Definition: avcodec.h:929

FFMIN
#define FFMIN(a, b)
Definition: common.h:96

OpusPsyStep::tone
float tone[OPUS_MAX_CHANNELS][CELT_MAX_BANDS]
Definition: opusenc_psy.h:34

OpusPsyStep::change_amp
float change_amp[OPUS_MAX_CHANNELS][CELT_MAX_BANDS]
Definition: opusenc_psy.h:36

opus_pvq.h

OpusPsyContext::lambda
float lambda
Definition: opusenc_psy.h:89

psy_output_groups
static void psy_output_groups(OpusPsyContext *s)
Definition: opusenc_psy.c:156

OpusPsyContext::avg_is_band
float avg_is_band
Definition: opusenc_psy.h:78

FFABS
#define FFABS(a)
Absolute value. Note that INT_MIN / INT64_MIN result in undefined behavior, as they are not representable as absolute values of their type.
Definition: common.h:72

CeltFrame::blocks
int blocks
Definition: opus_celt.h:112

OpusPsyContext::inflection_points_count
int inflection_points_count
Definition: opusenc_psy.h:91

CeltFrame::transient
int transient
Definition: opus_celt.h:106

ff_celt_freq_range
const uint8_t ff_celt_freq_range[]
Definition: opustab.c:767

OpusRangeCoder
Definition: opus_rc.h:40

CeltPVQ::band_cost
float(* band_cost)(struct CeltPVQ *pvq, CeltFrame *f, OpusRangeCoder *rc, int band, float *bits, float lambda)
Definition: opus_pvq.h:43

AV_LOG_INFO
#define AV_LOG_INFO
Standard information.
Definition: log.h:187

frame_size
int frame_size
Definition: mxfenc.c:1896

opusenc_psy.h

CELT_MAX_BANDS
#define CELT_MAX_BANDS
Definition: opus.h:45

AVCodecContext::sample_rate
int sample_rate
samples per second
Definition: avcodec.h:2523

CeltFrame::pf_tapset
int pf_tapset
Definition: opus_celt.h:126

AVCodecContext
main external API structure.
Definition: avcodec.h:1761

bessel_init
static int bessel_init(FFBesselFilter *s, float n, float f0, float fs, int highpass)
Definition: opusenc_utils.h:69

ff_opus_psy_signal_eof
void ff_opus_psy_signal_eof(OpusPsyContext *s)
Definition: opusenc_psy.c:533

OpusPsyContext::scratch
float scratch[2048]
Definition: opusenc_psy.h:74

index
int index
Definition: gxfenc.c:89

qsort.h

celt_search_for_intensity
static void celt_search_for_intensity(OpusPsyContext *s, CeltFrame *f)
Definition: opusenc_psy.c:344

OpusPsyContext::dual_stereo_used
int64_t dual_stereo_used
Definition: opusenc_psy.h:79

OpusPsyContext::p
OpusPacketInfo p
Definition: opusenc_psy.h:84

ff_opus_psy_end
av_cold int ff_opus_psy_end(OpusPsyContext *s)
Definition: opusenc_psy.c:538

CeltFrame::pvq
CeltPVQ * pvq
Definition: opus_celt.h:98

CELT_BLOCK_NB
Definition: opus_celt.h:62

ff_opus_psy_postencode_update
void ff_opus_psy_postencode_update(OpusPsyContext *s, CeltFrame *f, OpusRangeCoder *rc)
Definition: opusenc_psy.c:424

weight
static int weight(int i, int blen, int offset)
Definition: diracdec.c:1522

OpusPacketInfo::framesize
int framesize
Definition: opusenc.h:50

level
uint8_t level
Definition: svq3.c:207

OpusPsyContext::max_steps
int max_steps
Definition: opusenc_psy.h:68

int
int
Definition: ffmpeg_filter.c:190

OpusPsyStep::index
int index
Definition: opusenc_psy.h:31

CeltFrame
Definition: opus_celt.h:92

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

OpusBandExcitation::excitation_dist
float excitation_dist
Definition: opusenc_psy.h:45

CeltFrame::spread
enum CeltSpread spread
Definition: opus_celt.h:121

ff_mdct15_uninit
av_cold void ff_mdct15_uninit(MDCT15Context **ps)
Definition: mdct15.c:43

CeltFrame::tf_select
int tf_select
Definition: opus_celt.h:109

coeffs
static const int16_t coeffs[]
Definition: simple_idct_mmi.c:40

len
int len
Definition: vorbis_enc_data.h:452

step_collect_psy_metrics
static void step_collect_psy_metrics(OpusPsyContext *s, int index)
Definition: opusenc_psy.c:29

AVCodecContext::channels
int channels
number of audio channels
Definition: avcodec.h:2524

av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35

start
void INT64 start
Definition: avisynth_c.h:690

OpusPsyStep::energy
float energy[OPUS_MAX_CHANNELS][CELT_MAX_BANDS]
Definition: opusenc_psy.h:33

fsize
static int64_t fsize(FILE *f)
Definition: audiomatch.c:28

search_for_change_points
static void search_for_change_points(OpusPsyContext *s, float tgt_change, int offset_s, int offset_e, int resolution, int level)
Definition: opusenc_psy.c:114

CeltFrame::size
enum CeltBlockSize size
Definition: opus_celt.h:102

CeltFrame::alloc_trim
int alloc_trim
Definition: opus_celt.h:110

AVFrame::extended_data
uint8_t ** extended_data
pointers to the data planes/channels.
Definition: frame.h:248

MDCT15Context::mdct
void(* mdct)(struct MDCT15Context *s, float *dst, const float *src, ptrdiff_t stride)
Definition: mdct15.h:49

OpusEncOptions
Definition: opusenc.h:43

OPUS_MODE_HYBRID
Definition: opus.h:64

AVFrame::nb_samples
int nb_samples
number of audio samples (per channel) described by this frame
Definition: frame.h:267

OpusPsyStep
Definition: opusenc_psy.h:30

for
for(j=16;j >0;--j)
Definition: h264pred_template.c:469

CeltFrame::pf_octave
int pf_octave
Definition: opus_celt.h:124

OpusBandExcitation
Definition: opusenc_psy.h:43

CeltFrame::intensity_stereo
int intensity_stereo
Definition: opus_celt.h:117

opustab.h

OpusPsyContext::bsize_analysis
int bsize_analysis
Definition: opusenc_psy.h:72

OpusPsyContext::ex
OpusBandExcitation ex[OPUS_MAX_CHANNELS][CELT_MAX_BANDS]
Definition: opusenc_psy.h:63

ff_bufqueue_peek
static AVFrame * ff_bufqueue_peek(struct FFBufQueue *queue, unsigned index)
Get a buffer from the queue without altering it.
Definition: bufferqueue.h:87

tmp
static uint8_t tmp[11]
Definition: aes_ctr.c:26

OpusPsyContext::steps_to_process
int steps_to_process
Definition: opusenc_psy.h:87