#include <float.h>
#include "libavutil/avassert.h"
#include "libavutil/channel_layout.h"
#include "libavutil/mem.h"
#include "libavutil/opt.h"
#include "bufferqueue.h"
#include "audio.h"
#include "avfilter.h"
#include "filters.h"

Data Structures
struct	PeriodItem

struct	ChannelContext

struct	SpeechNormalizerContext

Macros
#define	FF_BUFQUEUE_SIZE (1024)

#define	MAX_ITEMS 882000

#define	MIN_PEAK (1. / 32768.)

#define	OFFSET(x) offsetof(SpeechNormalizerContext, x)

#define	FLAGS AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_RUNTIME_PARAM

#define	ANALYZE_CHANNEL(name, ptype, zero, min_peak)

#define	FILTER_CHANNELS(name, ptype)

#define	FILTER_LINK_CHANNELS(name, ptype, tlerp)

Functions
	AVFILTER_DEFINE_CLASS (speechnorm)

static int	get_pi_samples (PeriodItem *pi, int start, int end, int remain)

static int	available_samples (AVFilterContext *ctx)

static void	consume_pi (ChannelContext *cc, int nb_samples)

static double	next_gain (AVFilterContext *ctx, double pi_max_peak, int bypass, double state, double pi_rms_sum, int pi_size)

static void	next_pi (AVFilterContext *ctx, ChannelContext *cc, int bypass)

static double	min_gain (AVFilterContext *ctx, ChannelContext *cc, int max_size)

static double	dlerp (double min, double max, double mix)

static float	flerp (float min, float max, float mix)

static int	filter_frame (AVFilterContext *ctx)

static int	activate (AVFilterContext *ctx)

static int	config_input (AVFilterLink *inlink)

static int	process_command (AVFilterContext *ctx, const char *cmd, const char *args, char *res, int res_len, int flags)

static av_cold void	uninit (AVFilterContext *ctx)

Variables
static const AVOption	speechnorm_options []

static const AVFilterPad	inputs []

const FFFilter	ff_af_speechnorm

Detailed Description

Speech Normalizer

Definition in file af_speechnorm.c.

Macro Definition Documentation

◆ FF_BUFQUEUE_SIZE

#define FF_BUFQUEUE_SIZE (1024)

Definition at line 35 of file af_speechnorm.c.

◆ MAX_ITEMS

#define MAX_ITEMS 882000

Definition at line 42 of file af_speechnorm.c.

◆ MIN_PEAK

#define MIN_PEAK (1. / 32768.)

Definition at line 43 of file af_speechnorm.c.

◆ OFFSET

#define OFFSET ( x ) offsetof(SpeechNormalizerContext, x)

Definition at line 94 of file af_speechnorm.c.

◆ FLAGS

#define FLAGS AV_OPT_FLAG_AUDIO_PARAM|AV_OPT_FLAG_FILTERING_PARAM|AV_OPT_FLAG_RUNTIME_PARAM

Definition at line 95 of file af_speechnorm.c.

◆ ANALYZE_CHANNEL

#define ANALYZE_CHANNEL	(	name,
		ptype,
		zero,
		min_peak
	)

Definition at line 235 of file af_speechnorm.c.

◆ FILTER_CHANNELS

#define FILTER_CHANNELS	(	name,
		ptype
	)

Value:

/* Expands to filter_channels_<name>(): for each input channel, multiplies      \
 * nb_samples samples of type ptype from in by the channel's gain and stores    \
 * the result in out. */                                                        \
static void filter_channels_## name (AVFilterContext *ctx,                      \
                                     AVFrame *in, AVFrame *out, int nb_samples) \
{                                                                               \
    SpeechNormalizerContext *s = ctx->priv;                                     \
    AVFilterLink *inlink = ctx->inputs[0];                                      \
                                                                                \
    for (int ch = 0; ch < inlink->ch_layout.nb_channels; ch++) {                \
        ChannelContext *cc = &s->cc[ch];                                        \
        const ptype *src = (const ptype *)in->extended_data[ch];                \
        ptype *dst = (ptype *)out->extended_data[ch];                           \
        /* bypass is set when this channel has no index in s->ch_layout. */     \
        enum AVChannel channel = av_channel_layout_channel_from_index(&inlink->ch_layout, ch); \
        const int bypass = av_channel_layout_index_from_channel(&s->ch_layout, channel) < 0; \
        int n = 0;                                                              \
                                                                                \
        while (n < nb_samples) {                                                \
            ptype gain;                                                         \
            int size;                                                           \
                                                                                \
            /* Call next_pi() first, then read cc->pi_size and gain_state.      \
             * NOTE(review): presumably next_pi() refills them - confirm. */    \
            next_pi(ctx, cc, bypass);                                           \
            size = FFMIN(nb_samples - n, cc->pi_size);                          \
            av_assert1(size > 0);                                               \
            /* Read the gain before consume_pi() is called on cc. */            \
            gain = cc->gain_state;                                              \
            consume_pi(cc, size);                                               \
            /* If ctx->is_disabled is set, dst is left unwritten here while     \
             * consume_pi() and n still advance. */                             \
            for (int i = n; !ctx->is_disabled && i < n + size; i++)             \
                dst[i] = src[i] * gain;                                         \
            n += size;                                                          \
        }                                                                       \
    }                                                                           \
}

Definition at line 314 of file af_speechnorm.c.

◆ FILTER_LINK_CHANNELS

#define FILTER_LINK_CHANNELS	(	name,
		ptype,
		tlerp
	)

Definition at line 358 of file af_speechnorm.c.

Function Documentation

◆ AVFILTER_DEFINE_CLASS()

AVFILTER_DEFINE_CLASS ( speechnorm )

◆ get_pi_samples()

static int get_pi_samples	(	PeriodItem *	pi,
		int	start,
		int	end,
		int	remain
	)

static

Definition at line 123 of file af_speechnorm.c.

Referenced by available_samples().

◆ available_samples()

static int available_samples ( AVFilterContext * ctx )

static

Definition at line 144 of file af_speechnorm.c.

Referenced by activate(), and filter_frame().

◆ consume_pi()

static void consume_pi	(	ChannelContext *	cc,
		int	nb_samples
	)

static

Definition at line 160 of file af_speechnorm.c.

◆ next_gain()

static double next_gain	(	AVFilterContext *	ctx,
		double	pi_max_peak,
		int	bypass,
		double	state,
		double	pi_rms_sum,
		int	pi_size
	)

static

Definition at line 169 of file af_speechnorm.c.

Referenced by min_gain(), and next_pi().

◆ next_pi()

static void next_pi	(	AVFilterContext *	ctx,
		ChannelContext *	cc,
		int	bypass
	)

static

Definition at line 189 of file af_speechnorm.c.

◆ min_gain()

static double min_gain	(	AVFilterContext *	ctx,
		ChannelContext *	cc,
		int	max_size
	)

static

Definition at line 211 of file af_speechnorm.c.

◆ dlerp()

static double dlerp	(	double	min,
		double	max,
		double	mix
	)

static

Definition at line 348 of file af_speechnorm.c.

◆ flerp()

static float flerp	(	float	min,
		float	max,
		float	mix
	)

static

Definition at line 353 of file af_speechnorm.c.

◆ filter_frame()

static int filter_frame ( AVFilterContext * ctx )

static

Definition at line 413 of file af_speechnorm.c.

Referenced by activate().

◆ activate()

static int activate ( AVFilterContext * ctx )

static

Definition at line 476 of file af_speechnorm.c.

◆ config_input()

static int config_input ( AVFilterLink * inlink )

static

Definition at line 523 of file af_speechnorm.c.

◆ process_command()

static int process_command	(	AVFilterContext *	ctx,
		const char *	cmd,
		const char *	args,
		char *	res,
		int	res_len,
		int	flags
	)

static

Definition at line 560 of file af_speechnorm.c.

◆ uninit()

static av_cold void uninit ( AVFilterContext * ctx )

static

Definition at line 576 of file af_speechnorm.c.

Variable Documentation

◆ speechnorm_options

const AVOption speechnorm_options[]

static

Initial value:

= {
    /* Every option is declared twice: once under its long name and once under
     * a one-letter alias. Both entries of a pair share the same context field
     * (via OFFSET), type, default value and allowed range, and all entries
     * carry FLAGS. The table ends with a { NULL } sentinel entry. */
    { "peak", "set the peak value", OFFSET(peak_value), AV_OPT_TYPE_DOUBLE, {.dbl=0.95}, 0.0, 1.0, FLAGS },
    { "p",    "set the peak value", OFFSET(peak_value), AV_OPT_TYPE_DOUBLE, {.dbl=0.95}, 0.0, 1.0, FLAGS },
    { "expansion", "set the max expansion factor", OFFSET(max_expansion), AV_OPT_TYPE_DOUBLE, {.dbl=2.0}, 1.0, 50.0, FLAGS },
    { "e",         "set the max expansion factor", OFFSET(max_expansion), AV_OPT_TYPE_DOUBLE, {.dbl=2.0}, 1.0, 50.0, FLAGS },
    { "compression", "set the max compression factor", OFFSET(max_compression), AV_OPT_TYPE_DOUBLE, {.dbl=2.0}, 1.0, 50.0, FLAGS },
    { "c",           "set the max compression factor", OFFSET(max_compression), AV_OPT_TYPE_DOUBLE, {.dbl=2.0}, 1.0, 50.0, FLAGS },
    { "threshold", "set the threshold value", OFFSET(threshold_value), AV_OPT_TYPE_DOUBLE, {.dbl=0}, 0.0, 1.0, FLAGS },
    { "t",         "set the threshold value", OFFSET(threshold_value), AV_OPT_TYPE_DOUBLE, {.dbl=0}, 0.0, 1.0, FLAGS },
    { "raise", "set the expansion raising amount", OFFSET(raise_amount), AV_OPT_TYPE_DOUBLE, {.dbl=0.001}, 0.0, 1.0, FLAGS },
    { "r",     "set the expansion raising amount", OFFSET(raise_amount), AV_OPT_TYPE_DOUBLE, {.dbl=0.001}, 0.0, 1.0, FLAGS },
    { "fall", "set the compression raising amount", OFFSET(fall_amount), AV_OPT_TYPE_DOUBLE, {.dbl=0.001}, 0.0, 1.0, FLAGS },
    { "f",    "set the compression raising amount", OFFSET(fall_amount), AV_OPT_TYPE_DOUBLE, {.dbl=0.001}, 0.0, 1.0, FLAGS },
    /* The channel selection is stored as a string option; its default is "all". */
    { "channels", "set channels to filter", OFFSET(ch_layout_str), AV_OPT_TYPE_STRING, {.str="all"}, 0, 0, FLAGS },
    { "h",        "set channels to filter", OFFSET(ch_layout_str), AV_OPT_TYPE_STRING, {.str="all"}, 0, 0, FLAGS },
    { "invert", "set inverted filtering", OFFSET(invert), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, FLAGS },
    { "i",      "set inverted filtering", OFFSET(invert), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, FLAGS },
    { "link", "set linked channels filtering", OFFSET(link), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, FLAGS },
    { "l",    "set linked channels filtering", OFFSET(link), AV_OPT_TYPE_BOOL, {.i64=0}, 0, 1, FLAGS },
    { "rms", "set the RMS value", OFFSET(rms_value), AV_OPT_TYPE_DOUBLE, {.dbl=0.0}, 0.0, 1.0, FLAGS },
    { "m",   "set the RMS value", OFFSET(rms_value), AV_OPT_TYPE_DOUBLE, {.dbl=0.0}, 0.0, 1.0, FLAGS },
    { NULL }
}

Definition at line 97 of file af_speechnorm.c.

◆ inputs

const AVFilterPad inputs[]

static

Initial value:

= {
    /* Single audio input pad; config_input is installed as its config_props
     * callback. */
    {
        .name         = "default",
        .type         = AVMEDIA_TYPE_AUDIO,
        .config_props = config_input,
    },
}

Definition at line 585 of file af_speechnorm.c.

◆ ff_af_speechnorm

const FFFilter ff_af_speechnorm

Initial value:

= {
    /* Filter definition for "speechnorm": wires the option class, the private
     * context size, the activate/uninit/process_command callbacks and the
     * input/output pads together. */
    .p.name          = "speechnorm",
    .p.description   = NULL_IF_CONFIG_SMALL("Speech Normalizer."),
    .p.priv_class    = &speechnorm_class,
    /* Timeline support is declared as internal: the code generated by
     * FILTER_CHANNELS tests ctx->is_disabled itself. */
    .p.flags         = AVFILTER_FLAG_SUPPORT_TIMELINE_INTERNAL,
    .priv_size       = sizeof(SpeechNormalizerContext),
    .activate        = activate,
    .uninit          = uninit,
    FILTER_INPUTS(inputs),
    FILTER_OUTPUTS(ff_audio_default_filterpad),
    /* Only the FLTP and DBLP sample formats are accepted. */
    FILTER_SAMPLEFMTS(AV_SAMPLE_FMT_FLTP, AV_SAMPLE_FMT_DBLP),
    .process_command = process_command,
}

Definition at line 593 of file af_speechnorm.c.

Data Structures

Macros

Functions

Variables

Detailed Description

Macro Definition Documentation

◆ FF_BUFQUEUE_SIZE

◆ MAX_ITEMS

◆ MIN_PEAK

◆ OFFSET

◆ FLAGS

◆ ANALYZE_CHANNEL

◆ FILTER_CHANNELS

◆ FILTER_LINK_CHANNELS

Function Documentation

◆ AVFILTER_DEFINE_CLASS()

◆ get_pi_samples()

◆ available_samples()

◆ consume_pi()

◆ next_gain()

◆ next_pi()

◆ min_gain()

◆ dlerp()

◆ flerp()

◆ filter_frame()

◆ activate()

◆ config_input()

◆ process_command()

◆ uninit()

Variable Documentation

◆ speechnorm_options

◆ inputs

◆ ff_af_speechnorm