FFmpeg
nellymoserdec.c
Go to the documentation of this file.
1 /*
2  * NellyMoser audio decoder
3  * Copyright (c) 2007 a840bda5870ba11f19698ff6eb9581dfb0f95fa5,
4  * 539459aeb7d425140b62a3ec7dbf6dc8e408a306, and
5  * 520e17cd55896441042b14df2566a6eb610ed444
6  * Copyright (c) 2007 Loic Minier <lool at dooz.org>
7  * Benjamin Larsson
8  *
9  * Permission is hereby granted, free of charge, to any person obtaining a
10  * copy of this software and associated documentation files (the "Software"),
11  * to deal in the Software without restriction, including without limitation
12  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
13  * and/or sell copies of the Software, and to permit persons to whom the
14  * Software is furnished to do so, subject to the following conditions:
15  *
16  * The above copyright notice and this permission notice shall be included in
17  * all copies or substantial portions of the Software.
18  *
19  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
20  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
21  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
22  * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
23  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
24  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
25  * DEALINGS IN THE SOFTWARE.
26  */
27 
28 /**
29  * @file
30  * The 3 alphanumeric copyright notices are md5summed; they are from the original
31  * implementors. The original code is available from http://code.google.com/p/nelly2pcm/
32  */
33 
35 #include "libavutil/float_dsp.h"
36 #include "libavutil/lfg.h"
37 #include "libavutil/mem_internal.h"
38 #include "libavutil/tx.h"
39 
40 #define BITSTREAM_READER_LE
41 #include "avcodec.h"
42 #include "codec_internal.h"
43 #include "decode.h"
44 #include "get_bits.h"
45 #include "nellymoser.h"
46 #include "sinewin.h"
47 
48 
/**
 * Per-instance state of the Nellymoser decoder.
 *
 * NOTE(review): only some members are visible in this listing. The functions
 * below also access avctx, random_state, gb, fdsp, imdct_ctx, imdct_fn and
 * imdct_buf through this context -- confirm the full layout against the
 * complete file.
 */
49 typedef struct NellyMoserDecodeContext {
    /* Factor multiplied into every band power in nelly_decode_block();
     * decode_init() sets it to 1.0/(32768*8). */
53  float scale_bias;
    /* Destination buffer of the transform call in nelly_decode_block();
     * decode_init() points it at imdct_buf[0]. */
58  float *imdct_out;
    /* Output of the previous transform call, used as the overlap input;
     * starts at imdct_buf[1] and is swapped with imdct_out after every call. */
59  float *imdct_prev;
61 
63  const unsigned char block[NELLY_BLOCK_LEN],
64  float audio[NELLY_SAMPLES])
65 {
    /*
     * Decode one block into `audio`.
     *
     * Band values are read from s->gb and expanded into per-coefficient
     * arrays; then two passes each dequantize NELLY_FILL_LEN coefficients,
     * run the transform and write the windowed result into their own
     * NELLY_BUF_LEN-sized slice of `audio`.
     *
     * NOTE(review): the first signature line and listing lines 72, 88 and
     * 93-94 are absent from this listing. Nothing visible here initializes
     * s->gb from `block` or fills bits[]; the cross-reference index suggests
     * init_get_bits(), ff_nelly_get_sample_bits() and skip_bits_long() are
     * involved -- confirm against the complete file.
     */
66  int i,j;
    /* buf: band value per coefficient; pows: matching scaled power. */
67  float buf[NELLY_FILL_LEN], pows[NELLY_FILL_LEN];
68  float *aptr, *bptr, *pptr, val, pval;
69  int bits[NELLY_BUF_LEN];
70  unsigned char v;
71 
73 
74  bptr = buf;
75  pptr = pows;
    /* First band: a 6-bit index selects the starting value. */
76  val = ff_nelly_init_table[get_bits(&s->gb, 6)];
77  for (i=0 ; i<NELLY_BANDS ; i++) {
    /* Every later band adds a delta selected by a 5-bit index. */
78  if (i > 0)
79  val += ff_nelly_delta_table[get_bits(&s->gb, 5)];
    /* Negated 2^(val/2048), scaled by scale_bias. */
80  pval = -exp2(val/2048) * s->scale_bias;
    /* Replicate the band's value and power for each coefficient of band i. */
81  for (j = 0; j < ff_nelly_band_sizes_table[i]; j++) {
82  *bptr++ = val;
83  *pptr++ = pval;
84  }
85 
86  }
87 
89 
    /* Two passes; pass i writes to audio[i * NELLY_BUF_LEN ...]. */
90  for (i = 0; i < 2; i++) {
91  aptr = audio + i * NELLY_BUF_LEN;
92 
95 
96  for (j = 0; j < NELLY_FILL_LEN; j++) {
    /* No bits for this coefficient: use M_SQRT1_2 * pows[j], with the
     * sign flipped when the low bit of the next LFG value is set. */
97  if (bits[j] <= 0) {
98  aptr[j] = M_SQRT1_2*pows[j];
99  if (av_lfg_get(&s->random_state) & 1)
100  aptr[j] *= -1.0;
101  } else {
    /* Read bits[j] bits; (1<<bits[j])-1 is the table offset for that
     * bit width and v selects the entry within it. */
102  v = get_bits(&s->gb, bits[j]);
103  aptr[j] = ff_nelly_dequantization_table[(1<<bits[j])-1+v]*pows[j];
104  }
105  }
    /* Zero the coefficients from NELLY_FILL_LEN up to NELLY_BUF_LEN. */
106  memset(&aptr[NELLY_FILL_LEN], 0,
107  (NELLY_BUF_LEN - NELLY_FILL_LEN) * sizeof(float));
108 
    /* Run the transform created in decode_init(): aptr -> imdct_out. */
109  s->imdct_fn(s->imdct_ctx, s->imdct_out, aptr, sizeof(float));
    /* Combine the second half of the previous output with the new output
     * using ff_sine_128; the result overwrites aptr. */
110  s->fdsp->vector_fmul_window(aptr, s->imdct_prev + NELLY_BUF_LEN / 2,
111  s->imdct_out, ff_sine_128,
112  NELLY_BUF_LEN / 2);
    /* The buffer just written becomes "previous" for the next call. */
113  FFSWAP(float *, s->imdct_out, s->imdct_prev);
114  }
115 }
116 
/**
 * Decoder init callback.
 *
 * Points imdct_out/imdct_prev at the two halves of imdct_buf, seeds the
 * random generator with 0, creates the transform (AV_TX_FLOAT_MDCT, inv = 1,
 * len = 128, scale 1.0), sets scale_bias and selects float output.
 *
 * @param avctx codec context; its sample_fmt is set to AV_SAMPLE_FMT_FLT
 * @return 0 on success, the av_tx_init() error code if the transform cannot
 *         be created, or AVERROR(ENOMEM) if s->fdsp is NULL
 *
 * NOTE(review): listing lines 121, 131, 138-139 and 142 are absent here.
 * Presumably they declare `s`, allocate s->fdsp, set the channel layout and
 * initialize the sine window -- confirm against the complete file.
 * NOTE(review): the ENOMEM path returns after av_tx_init() has succeeded
 * without calling av_tx_uninit(); whether decode_end() runs after a failed
 * init depends on codec flags not visible in this listing -- verify.
 */
117 static av_cold int decode_init(AVCodecContext * avctx)
118 {
119  int ret;
120  float scale = 1.0f;
122 
123  s->avctx = avctx;
124  s->imdct_out = s->imdct_buf[0];
125  s->imdct_prev = s->imdct_buf[1];
    /* Fixed seed 0 for the random generator. */
126  av_lfg_init(&s->random_state, 0);
127  if ((ret = av_tx_init(&s->imdct_ctx, &s->imdct_fn, AV_TX_FLOAT_MDCT,
128  1, 128, &scale, 0)) < 0)
129  return ret;
130 
132  if (!s->fdsp)
133  return AVERROR(ENOMEM);
134 
135  s->scale_bias = 1.0/(32768*8);
136  avctx->sample_fmt = AV_SAMPLE_FMT_FLT;
137 
140 
141  /* Generate overlap window */
143 
144  return 0;
145 }
146 
148  int *got_frame_ptr, AVPacket *avpkt)
149 {
    /*
     * Decode one packet: every complete NELLY_BLOCK_LEN-byte block in the
     * packet becomes NELLY_SAMPLES float samples in frame->data[0].
     *
     * Returns buf_size (the whole packet is reported as consumed),
     * AVERROR_INVALIDDATA when the packet holds no complete block, or the
     * ff_get_buffer() error code.
     *
     * NOTE(review): the first signature line and listing line 152 are absent
     * from this listing; presumably line 152 declares `s` -- confirm.
     */
150  const uint8_t *buf = avpkt->data;
151  int buf_size = avpkt->size;
153  int blocks, i, ret;
154  float *samples_flt;
155 
    /* Integer division: a trailing partial block is not counted. */
156  blocks = buf_size / NELLY_BLOCK_LEN;
157 
158  if (blocks <= 0) {
159  av_log(avctx, AV_LOG_ERROR, "Packet is too small\n");
160  return AVERROR_INVALIDDATA;
161  }
162 
    /* Leftover bytes only produce a warning; decoding continues. */
163  if (buf_size % NELLY_BLOCK_LEN) {
164  av_log(avctx, AV_LOG_WARNING, "Leftover bytes: %d.\n",
165  buf_size % NELLY_BLOCK_LEN);
166  }
167 
168  /* get output buffer */
169  frame->nb_samples = NELLY_SAMPLES * blocks;
170  if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
171  return ret;
172  samples_flt = (float *)frame->data[0];
173 
    /* Decode block by block, advancing input and output in lockstep. */
174  for (i=0 ; i<blocks ; i++) {
175  nelly_decode_block(s, buf, samples_flt);
176  samples_flt += NELLY_SAMPLES;
177  buf += NELLY_BLOCK_LEN;
178  }
179 
180  *got_frame_ptr = 1;
181 
182  return buf_size;
183 }
184 
/**
 * Decoder close callback: releases the transform context and the float DSP
 * context held in the private state.
 *
 * @return always 0
 *
 * NOTE(review): listing line 186 is absent here; presumably it declares `s`
 * from the codec context -- confirm against the complete file.
 */
185 static av_cold int decode_end(AVCodecContext * avctx) {
187 
188  av_tx_uninit(&s->imdct_ctx);
189  av_freep(&s->fdsp);
190 
191  return 0;
192 }
193 
195  .p.name = "nellymoser",
196  CODEC_LONG_NAME("Nellymoser Asao"),
197  .p.type = AVMEDIA_TYPE_AUDIO,
198  .p.id = AV_CODEC_ID_NELLYMOSER,
    /* Size of the decoder's private state. */
199  .priv_data_size = sizeof(NellyMoserDecodeContext),
    /* Init and close callbacks defined earlier in this file. */
200  .init = decode_init,
201  .close = decode_end,
    /* NOTE(review): the declarator line and listing lines 202-203 and 205 are
     * absent from this listing; presumably they hold the decode callback,
     * the capability flags and the sample-format list terminator -- confirm
     * against the complete file. */
204  .p.sample_fmts = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLT,
206 };
skip_bits_long
static void skip_bits_long(GetBitContext *s, int n)
Skips the specified number of bits.
Definition: get_bits.h:278
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
NELLY_HEADER_BITS
#define NELLY_HEADER_BITS
Definition: nellymoser.h:41
AVERROR
Filter design: the word “frame” indicates either a video frame or a group of audio samples, as stored in an AVFrame structure. Format negotiation: for each input and each output, the list of supported formats. For video, that means pixel format. For audio, that means channel layout, sample format and sample rate; they are references to shared objects. When the negotiation mechanism computes the intersection of the formats supported at each end of a link, all references to both lists are replaced with a reference to the intersection. And when a single format is eventually chosen for a link amongst the remaining list, all references to the list are updated. That means that if a filter requires that its input and output have the same format amongst a supported list, all it has to do is use a reference to the same list of formats. query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
mem_internal.h
decode_init
static av_cold int decode_init(AVCodecContext *avctx)
Definition: nellymoserdec.c:117
av_lfg_init
av_cold void av_lfg_init(AVLFG *c, unsigned int seed)
Definition: lfg.c:32
nellymoser.h
AVTXContext
Definition: tx_priv.h:235
NELLY_FILL_LEN
#define NELLY_FILL_LEN
Definition: nellymoser.h:44
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:344
AVPacket::data
uint8_t * data
Definition: packet.h:522
NELLY_BLOCK_LEN
#define NELLY_BLOCK_LEN
Definition: nellymoser.h:40
FFCodec
Definition: codec_internal.h:127
init_get_bits
static int init_get_bits(GetBitContext *s, const uint8_t *buffer, int bit_size)
Initialize GetBitContext.
Definition: get_bits.h:514
av_tx_init
av_cold int av_tx_init(AVTXContext **ctx, av_tx_fn *tx, enum AVTXType type, int inv, int len, const void *scale, uint64_t flags)
Initialize a transform context with the given configuration. (i)MDCTs with an odd length are currently...
Definition: tx.c:902
ff_nellymoser_decoder
const FFCodec ff_nellymoser_decoder
Definition: nellymoserdec.c:194
AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:365
get_bits
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:335
FFCodec::p
AVCodec p
The public AVCodec.
Definition: codec_internal.h:131
AVCodecContext::ch_layout
AVChannelLayout ch_layout
Audio channel layout.
Definition: avcodec.h:1065
ff_nelly_band_sizes_table
const uint8_t ff_nelly_band_sizes_table[NELLY_BANDS]
Definition: nellymoser.c:68
GetBitContext
Definition: get_bits.h:108
AVCodecContext::flags
int flags
AV_CODEC_FLAG_*.
Definition: avcodec.h:502
val
static double val(void *priv, double ch)
Definition: aeval.c:78
ff_nelly_dequantization_table
const float ff_nelly_dequantization_table[127]
Definition: nellymoser.c:41
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
av_cold
#define av_cold
Definition: attributes.h:90
av_tx_fn
void(* av_tx_fn)(AVTXContext *s, void *out, void *in, ptrdiff_t stride)
Function pointer to a function to perform the transform.
Definition: tx.h:151
AV_TX_FLOAT_MDCT
@ AV_TX_FLOAT_MDCT
Standard MDCT with a sample data type of float, double or int32_t, respectively.
Definition: tx.h:68
FF_CODEC_DECODE_CB
#define FF_CODEC_DECODE_CB(func)
Definition: codec_internal.h:287
s
#define s(width, name)
Definition: cbs_vp9.c:198
av_lfg_get
static unsigned int av_lfg_get(AVLFG *c)
Get the next random unsigned 32-bit number using an ALFG.
Definition: lfg.h:53
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
NELLY_BANDS
#define NELLY_BANDS
Definition: nellymoser.h:39
lfg.h
bits
uint8_t bits
Definition: vp3data.h:128
decode.h
get_bits.h
ff_nelly_init_table
const uint16_t ff_nelly_init_table[64]
Definition: nellymoser.c:72
NellyMoserDecodeContext::imdct_prev
float * imdct_prev
Definition: nellymoserdec.c:59
CODEC_LONG_NAME
#define CODEC_LONG_NAME(str)
Definition: codec_internal.h:272
frame
static AVFrame * frame
Definition: demux_decode.c:54
ff_nelly_delta_table
const int16_t ff_nelly_delta_table[32]
Definition: nellymoser.c:81
NellyMoserDecodeContext::random_state
AVLFG random_state
Definition: nellymoserdec.c:51
NellyMoserDecodeContext::imdct_buf
float imdct_buf[2][NELLY_BUF_LEN]
Definition: nellymoserdec.c:57
NELLY_DETAIL_BITS
#define NELLY_DETAIL_BITS
Definition: nellymoser.h:42
NellyMoserDecodeContext
Definition: nellymoserdec.c:49
decode_end
static av_cold int decode_end(AVCodecContext *avctx)
Definition: nellymoserdec.c:185
NellyMoserDecodeContext::imdct_ctx
AVTXContext * imdct_ctx
Definition: nellymoserdec.c:55
float_dsp.h
AV_CODEC_CAP_CHANNEL_CONF
#define AV_CODEC_CAP_CHANNEL_CONF
Codec should fill in channel configuration and samplerate instead of container.
Definition: codec.h:106
AVLFG
Context structure for the Lagged Fibonacci PRNG.
Definition: lfg.h:33
ff_get_buffer
int ff_get_buffer(AVCodecContext *avctx, AVFrame *frame, int flags)
Get a buffer for a frame.
Definition: decode.c:1569
init
int(* init)(AVBSFContext *ctx)
Definition: dts2pts.c:365
AV_CODEC_CAP_DR1
#define AV_CODEC_CAP_DR1
Codec uses get_buffer() or get_encode_buffer() for allocating buffers and supports custom allocators.
Definition: codec.h:52
AVPacket::size
int size
Definition: packet.h:523
scale
static void scale(int *out, const int *in, const int w, const int h, const int shift)
Definition: vvc_intra.c:291
AVChannelLayout
An AVChannelLayout holds information about the channel layout of audio data.
Definition: channel_layout.h:303
codec_internal.h
DECLARE_ALIGNED
#define DECLARE_ALIGNED(n, t, v)
Definition: mem_internal.h:109
NellyMoserDecodeContext::fdsp
AVFloatDSPContext * fdsp
Definition: nellymoserdec.c:54
for
for(k=2;k<=8;++k)
Definition: h264pred_template.c:425
AVCodecContext::sample_fmt
enum AVSampleFormat sample_fmt
audio sample format
Definition: avcodec.h:1057
AV_SAMPLE_FMT_NONE
@ AV_SAMPLE_FMT_NONE
Definition: samplefmt.h:56
NELLY_BUF_LEN
#define NELLY_BUF_LEN
Definition: nellymoser.h:43
AVFloatDSPContext
Definition: float_dsp.h:22
sinewin.h
NellyMoserDecodeContext::imdct_fn
av_tx_fn imdct_fn
Definition: nellymoserdec.c:56
av_tx_uninit
av_cold void av_tx_uninit(AVTXContext **ctx)
Frees a context and sets *ctx to NULL, does nothing when *ctx == NULL.
Definition: tx.c:294
NellyMoserDecodeContext::imdct_out
float * imdct_out
Definition: nellymoserdec.c:58
NELLY_SAMPLES
#define NELLY_SAMPLES
Definition: nellymoser.h:48
AVFrame::nb_samples
int nb_samples
number of audio samples (per channel) described by this frame
Definition: frame.h:424
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
AVSampleFormat
AVSampleFormat
Audio sample formats.
Definition: samplefmt.h:55
exp2
#define exp2(x)
Definition: libm.h:288
AVCodec::name
const char * name
Name of the codec implementation.
Definition: codec.h:194
NellyMoserDecodeContext::scale_bias
float scale_bias
Definition: nellymoserdec.c:53
avcodec.h
ret
ret
Definition: filter_design.txt:187
NellyMoserDecodeContext::gb
GetBitContext gb
Definition: nellymoserdec.c:52
FFSWAP
#define FFSWAP(type, a, b)
Definition: macros.h:52
decode_tag
static int decode_tag(AVCodecContext *avctx, AVFrame *frame, int *got_frame_ptr, AVPacket *avpkt)
Definition: nellymoserdec.c:147
NellyMoserDecodeContext::avctx
AVCodecContext * avctx
Definition: nellymoserdec.c:50
M_SQRT1_2
#define M_SQRT1_2
Definition: mathematics.h:103
AVCodecContext
main external API structure.
Definition: avcodec.h:445
channel_layout.h
ff_init_ff_sine_windows
void ff_init_ff_sine_windows(int index)
initialize the specified entry of ff_sine_windows
Definition: sinewin_tablegen.h:101
av_channel_layout_uninit
void av_channel_layout_uninit(AVChannelLayout *channel_layout)
Free any allocated data in the channel layout and reset the channel count to 0.
Definition: channel_layout.c:432
nelly_decode_block
static void nelly_decode_block(NellyMoserDecodeContext *s, const unsigned char block[NELLY_BLOCK_LEN], float audio[NELLY_SAMPLES])
Definition: nellymoserdec.c:62
AV_CODEC_CAP_PARAM_CHANGE
#define AV_CODEC_CAP_PARAM_CHANGE
Codec supports changed parameters at any point.
Definition: codec.h:118
AV_CODEC_FLAG_BITEXACT
#define AV_CODEC_FLAG_BITEXACT
Use only bitexact stuff (except (I)DCT).
Definition: avcodec.h:342
AV_CHANNEL_LAYOUT_MONO
#define AV_CHANNEL_LAYOUT_MONO
Definition: channel_layout.h:378
AVPacket
This structure stores compressed data.
Definition: packet.h:499
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:472
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:34
avpriv_float_dsp_alloc
av_cold AVFloatDSPContext * avpriv_float_dsp_alloc(int bit_exact)
Allocate a float DSP context.
Definition: float_dsp.c:135
block
The exact code depends on how similar the blocks are and how related they are to the block
Definition: filter_design.txt:207
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
AV_SAMPLE_FMT_FLT
@ AV_SAMPLE_FMT_FLT
float
Definition: samplefmt.h:60
AV_CODEC_ID_NELLYMOSER
@ AV_CODEC_ID_NELLYMOSER
Definition: codec_id.h:473
tx.h
ff_nelly_get_sample_bits
void ff_nelly_get_sample_bits(const float *buf, int *bits)
Definition: nellymoser.c:118