36 #define MAX_CHANNELS 6
37 #define DCA_MAX_FRAME_SIZE 16384
38 #define DCA_HEADER_SIZE 13
39 #define DCA_LFE_SAMPLES 8
41 #define DCAENC_SUBBANDS 32
43 #define SUBSUBFRAMES 2
44 #define SUBBAND_SAMPLES (SUBFRAMES * SUBSUBFRAMES * 8)
89 static double hom(
double f)
93 return -3.64 * pow(f1, -0.8)
94 + 6.8 *
exp(-0.6 * (f1 - 3.4) * (f1 - 3.4))
95 - 6.0 *
exp(-0.15 * (f1 - 8.7) * (f1 - 8.7))
96 - 0.0006 * (f1 * f1) * (f1 * f1);
101 double h = (f -
fc[i]) /
erb[i];
105 return 20 * log10(h);
112 int i, min_frame_bits;
123 "encoder will guess the layout, but it "
124 "might be incorrect.\n");
145 for (i = 0; i < 9; i++) {
175 for (i = 1; i < 512; i++) {
181 for (i = 0; i < 2048; i++) {
185 for (k = 0; k < 32; k++) {
186 for (j = 0; j < 8; j++) {
192 for (i = 0; i < 512; i++) {
197 for (i = 0; i < 9; i++) {
198 for (j = 0; j <
AUBANDS; j++) {
199 for (k = 0; k < 256; k++) {
207 for (i = 0; i < 256; i++) {
208 double add = 1 +
ff_exp10(-0.01 * i);
211 for (j = 0; j < 8; j++) {
213 for (i = 0; i < 512; i++) {
215 accum += reconst * cos(2 *
M_PI * (i + 0.5 - 256) * (j + 0.5) / 512);
219 for (j = 0; j < 8; j++) {
221 for (i = 0; i < 512; i++) {
223 accum += reconst * cos(2 *
M_PI * (i + 0.5 - 256) * (j + 0.5) / 512);
238 return cos_t(x - 512);
248 int64_t
r = (int64_t)a * b + 0x80000000ULL;
254 int ch, subs, i, k, j;
262 for (i = 0; i < 512; i++)
271 for (i = 0; i < 64; i++)
274 for (k = 0, i = hist_start, j = 0;
275 i < 512; k = (k + 1) & 63, i++, j++)
277 for (i = 0; i < hist_start; k = (k + 1) & 63, i++, j++)
280 for (k = 16; k < 32; k++)
281 accum[k] = accum[k] - accum[31 - k];
282 for (k = 32; k < 48; k++)
283 accum[k] = accum[k] + accum[95 - k];
285 for (band = 0; band < 32; band++) {
287 for (i = 16; i < 48; i++) {
288 int s = (2 * band + 1) * (2 * (i + 16) + 1);
292 c->
subband[subs][
band][ch] = ((band + 1) & 2) ? -resp : resp;
296 for (i = 0; i < 32; i++)
297 hist[i + hist_start] = input[(subs * 32 + i) * c->
channels + chi];
298 hist_start = (hist_start + 32) & 511;
312 for (i = 0; i < 512; i++)
319 for (i = hist_start, j = 0; i < 512; i++, j++)
321 for (i = 0; i < hist_start; i++, j++)
327 for (i = 0; i < 64; i++)
328 hist[i + hist_start] = input[(lfes * 64 + i) * c->
channels + lfech];
330 hist_start = (hist_start + 64) & 511;
345 for (i = 0; i < 256; i++) {
347 rin[i].
re =
mul32(in[2 * i], 0x3fffffff - (
cos_t(8 * i + 2) >> 1));
348 rin[i].
im =
mul32(in[2 * i + 1], 0x3fffffff - (
cos_t(8 * i + 6) >> 1));
351 for (i = 0; i < 256; i++) {
358 for (j = 256, l = 1; j != 1; j >>= 1, l <<= 1) {
359 for (k = 0; k < 256; k += j) {
360 for (i = k; i < k + j / 2; i++) {
364 sum.
re = buf[i].
re + buf[i + j / 2].
re;
365 sum.
im = buf[i].
im + buf[i + j / 2].
im;
367 diff.
re = buf[i].
re - buf[i + j / 2].
re;
368 diff.
im = buf[i].
im - buf[i + j / 2].
im;
381 for (i = 0; i < 256; i++) {
388 for (i = 0; i < 256; i++) {
392 o1.
re = rout[i].
re - rout[255 - i].
re;
393 o1.
im = rout[i].
im + rout[255 - i].
im;
395 o2.
re = rout[i].
im - rout[255 - i].
im;
396 o2.
im = -rout[i].
re - rout[255 - i].
re;
413 for (i = 1024; i > 0; i >>= 1) {
443 for (j = 0; j < 256; j++) {
445 out_cb_unnorm[j] = -2047;
448 for (i = 0; i <
AUBANDS; i++) {
450 for (j = 0; j < 256; j++)
451 denom =
add_cb(denom, power[j] +
auf[samplerate_index][i][j]);
452 for (j = 0; j < 256; j++)
453 out_cb_unnorm[j] =
add_cb(out_cb_unnorm[j],
454 -denom +
auf[samplerate_index][i][j]);
457 for (j = 0; j < 256; j++)
458 out_cb[j] =
add_cb(out_cb[j], -out_cb_unnorm[j] - ca_cb - cs_cb);
471 for (f = 0; f < 4; f++)
472 walk(c, 0, 0, f, 0, -2047, channel, arg);
474 for (f = 0; f < 8; f++)
475 walk(c, band, band - 1, 8 * band - 4 + f,
486 for (f = 0; f < 4; f++)
487 walk(c, 31, 31, 256 - 4 + f, 0, -2047, channel, arg);
489 for (f = 0; f < 8; f++)
490 walk(c, band, band + 1, 8 * band + 4 + f,
507 int i, k,
band, ch, ssf;
510 for (i = 0; i < 256; i++)
518 for (i = 0, k = 128 + 256 * ssf; k < 512; i++, k++)
520 for (k -= 512; i < 512; i++, k++)
521 data[i] = input[k * c->
channels + chi];
524 for (i = 0; i < 256; i++) {
533 for (band = 0; band < 32; band++) {
544 for (band = 0; band < 32; band++)
569 #define USED_1ABITS 1
570 #define USED_NABITS 2
571 #define USED_26ABITS 4
575 int ch,
band, ret = 0;
583 for (band = 0; band < 32; band++) {
586 if (snr_cb >= 1312) {
589 }
else if (snr_cb >= 222) {
592 }
else if (snr_cb >= 0) {
602 for (band = 0; band < 32; band++)
636 for (down =
snr_fudge >> 1; down; down >>= 1) {
652 for (k = 0; k < 512; k++)
653 for (ch = 0; ch < c->
channels; ch++) {
665 value = value >> quant.
e;
672 int our_nscale, try_remove;
681 for (try_remove = 64; try_remove > 0; try_remove >>= 1) {
688 our_nscale -= try_remove;
691 if (our_nscale >= 125)
705 for (band = 0; band < 32; band++)
709 &c->
quant[band][ch]);
720 for (band = 0; band < 32; band++)
810 static const int bitlen[11] = { 0, 1, 2, 2, 2, 2, 3, 3, 3, 3, 3 };
811 static const int thr[11] = { 0, 1, 3, 3, 3, 3, 7, 7, 7, 7, 7 };
846 for (i = 1; i < 11; i++)
856 if (c->
abits[band][ch] <= 7) {
858 for (i = 0; i < 8; i += 4) {
860 for (j = 3; j >= 0; j--) {
869 for (i = 0; i < 8; i++) {
This structure describes decoded (raw) audio or video data.
static int32_t cb_to_add[256]
static int noise(AVBSFContext *ctx, AVPacket *out)
ptrdiff_t const GLvoid * data
int32_t eff_masking_curve_cb[256]
static void put_sbits(PutBitContext *pb, int n, int32_t value)
static int32_t auf[9][AUBANDS][256]
static void put_bits(Jpeg2000EncoderContext *s, int val, int n)
put n times val bit
#define AV_LOG_WARNING
Something somehow does not look correct.
static void put_frame_header(DCAEncContext *c)
int64_t bit_rate
the average bitrate
static av_cold int init(AVCodecContext *avctx)
const int8_t * channel_order_tab
channel reordering table, lfe and non lfe
static int32_t band_spectrum[2][8]
static const uint8_t bitstream_sfreq[]
static const uint16_t erb[]
#define AV_CODEC_CAP_EXPERIMENTAL
Codec is experimental and is thus avoided in favor of non experimental encoders.
static void shift_history(DCAEncContext *c, const int32_t *input)
#define AV_CH_LAYOUT_STEREO
static int encode_frame(AVCodecContext *avctx, AVPacket *avpkt, const AVFrame *frame, int *got_packet_ptr)
static void walk_band_high(DCAEncContext *c, int band, int channel, walk_band_t walk, int32_t *arg)
#define AV_CH_LAYOUT_5POINT0
int32_t subband[SUBBAND_SAMPLES][DCAENC_SUBBANDS][MAX_CHANNELS]
const float ff_dca_fir_32bands_nonperfect[512]
static void walk_band_low(DCAEncContext *c, int band, int channel, walk_band_t walk, int32_t *arg)
#define av_assert0(cond)
assert() equivalent, that is always enabled.
static void calc_masking(DCAEncContext *c, const int32_t *input)
static const softfloat stepsize_inv[27]
const uint32_t ff_dca_bit_rates[32]
static int32_t lfe_fir_64i[512]
int64_t duration
Duration of this packet in AVStream->time_base units, 0 if unknown.
static int32_t cos_table[2048]
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
static int calc_one_scale(int32_t peak_cb, int abits, softfloat *quant)
int scale_factor[DCAENC_SUBBANDS][MAX_CHANNELS]
int32_t history[512][MAX_CHANNELS]
int32_t masking_curve_cb[SUBSUBFRAMES][256]
static void quantize_all(DCAEncContext *c)
static int32_t sin_t(int x)
#define AV_CH_LAYOUT_5POINT1
static int32_t add_cb(int32_t a, int32_t b)
static const softfloat scalefactor_inv[128]
static void lfe_downsample(DCAEncContext *c, const int32_t *input)
softfloat quant[DCAENC_SUBBANDS][MAX_CHANNELS]
static double hom(double f)
int32_t band_masking_cb[32]
static av_always_inline double ff_exp10(double x)
Compute 10^x for floating point values.
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
static void put_subframe(DCAEncContext *c, int subframe)
static const int snr_fudge
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
const uint8_t ff_reverse[256]
int abits[DCAENC_SUBBANDS][MAX_CHANNELS]
const float ff_dca_lfe_fir_64[256]
static void update_band_masking(DCAEncContext *c, int band1, int band2, int f, int32_t spectrum1, int32_t spectrum2, int channel, int32_t *arg)
simple assert() macros that are a bit more flexible than ISO C assert().
const char * name
Name of the codec implementation.
const uint32_t ff_dca_quant_levels[32]
static const uint8_t offset[127][2]
static int32_t quantize_value(int32_t value, softfloat quant)
static const int sample_rates[]
uint64_t channel_layout
Audio channel layout.
static int put_bits_count(PutBitContext *s)
static const uint16_t fc[]
static void assign_bits(DCAEncContext *c)
audio channel layout utility functions
static int init_quantization_noise(DCAEncContext *c, int noise)
typedef void(APIENTRY *FF_PFNGLACTIVETEXTUREPROC)(GLenum texture)
GLsizei GLboolean const GLfloat * value
#define DCA_MAX_FRAME_SIZE
#define AVERROR_PATCHWELCOME
Not yet implemented in FFmpeg, patches welcome.
int32_t quantized[SUBBAND_SAMPLES][DCAENC_SUBBANDS][MAX_CHANNELS]
int32_t peak_cb[DCAENC_SUBBANDS][MAX_CHANNELS]
int frame_size
Number of samples per channel in an audio frame.
static const int8_t channel_reorder_lfe[7][5]
static void put_primary_audio_header(DCAEncContext *c)
static void find_peaks(DCAEncContext *c)
static int32_t mul32(int32_t a, int32_t b)
Libavcodec external API header.
const int32_t * band_spectrum
AVSampleFormat
Audio sample formats.
static int32_t cb_to_level[2048]
int sample_rate
samples per second
main external API structure.
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(constint16_t *) pi >>8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(constint32_t *) pi >>24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(constfloat *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(constfloat *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(constfloat *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(constdouble *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(constdouble *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(constdouble *) pi *(1U<< 31))))#defineSET_CONV_FUNC_GROUP(ofmt, ifmt) staticvoidset_generic_function(AudioConvert *ac){}voidff_audio_convert_free(AudioConvert **ac){if(!*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);}AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enumAVSampleFormatout_fmt, enumAVSampleFormatin_fmt, intchannels, intsample_rate, intapply_map){AudioConvert *ac;intin_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) returnNULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method!=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt)>2){ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc){av_free(ac);returnNULL;}returnac;}in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar){ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar?ac->channels:1;}elseif(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;elseac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);returnac;}intff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in){intuse_generic=1;intlen=in->nb_samples;intp;if(ac->dc){av_log(ac->avr, AV_LOG_TRACE,"%dsamples-audio_convert:%sto%s(dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));returnff_convert_dither(ac-> in
static void put_subframe_samples(DCAEncContext *c, int ss, int band, int ch)
static void adjust_jnd(int samplerate_index, const int32_t in[512], int32_t out_cb[256])
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int64_t size, int64_t min_size)
Check AVPacket size and/or allocate data.
int32_t worst_quantization_noise
static int encode_init(AVCodecContext *avctx)
static int32_t band_interpolation[2][512]
static int32_t cos_t(int x)
static void calc_scales(DCAEncContext *c)
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
static void subband_transform(DCAEncContext *c, const int32_t *input)
internal math functions header
static void fft(const int32_t in[2 *256], cplx32 out[256])
common internal api header.
static void flush_put_bits(PutBitContext *s)
Pad the end of the output stream with zeros.
common internal and external API header
static int32_t get_cb(int32_t in)
static void init_put_bits(PutBitContext *s, uint8_t *buffer, int buffer_size)
Initialize the PutBitContext s.
static av_always_inline int diff(const uint32_t a, const uint32_t b)
int channels
number of audio channels
void(* walk_band_t)(DCAEncContext *c, int band1, int band2, int f, int32_t spectrum1, int32_t spectrum2, int channel, int32_t *arg)
static int32_t half32(int32_t a)
static const int8_t channel_reorder_nolfe[7][5]
int64_t av_get_default_channel_layout(int nb_channels)
Return default channel layout for a given number of channels.
static enum AVSampleFormat sample_fmts[]
const int32_t * band_interpolation
int32_t downsampled_lfe[DCA_LFE_SAMPLES]
static av_always_inline int64_t ff_samples_to_time_base(AVCodecContext *avctx, int64_t samples)
Rescale from sample rate to AVCodecContext.time_base.
#define FFSWAP(type, a, b)
static const AVCodecDefault defaults[]
static const uint8_t lfe_index[7]
static const int bit_consumption[27]
const float ff_dca_fir_32bands_perfect[512]
#define AV_CH_LAYOUT_MONO
This structure stores compressed data.
int nb_samples
number of audio samples (per channel) described by this frame
static double gammafilter(int i, double f)
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...