FFmpeg
ra288.c
Go to the documentation of this file.
1 /*
2  * RealAudio 2.0 (28.8K)
3  * Copyright (c) 2003 The FFmpeg project
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
#include "libavutil/channel_layout.h"
#include "libavutil/float_dsp.h"
#include "libavutil/internal.h"
#include "libavutil/mem_internal.h"

#define BITSTREAM_READER_LE
#include "avcodec.h"
#include "celp_filters.h"
#include "codec_internal.h"
#include "decode.h"
#include "get_bits.h"
#include "lpc.h"
#include "ra288.h"
35 
/*
 * Upper bounds for the (order, n, non_rec) triple passed to backward_filter().
 * The speech filter uses 36/40/35 and the gain filter 10/8/20, so the speech
 * filter determines all three maxima.
 */
#define MAX_BACKWARD_FILTER_ORDER  36
#define MAX_BACKWARD_FILTER_LEN    40
#define MAX_BACKWARD_FILTER_NONREC 35

/* Number of samples produced per decoded block. */
#define RA288_BLOCK_SIZE        5
/* Number of blocks decoded from each packet. */
#define RA288_BLOCKS_PER_FRAME 32
42 
43 typedef struct RA288Context {
44  void (*vector_fmul)(float *dst, const float *src0, const float *src1,
45  int len);
46  DECLARE_ALIGNED(32, float, sp_lpc)[FFALIGN(36, 16)]; ///< LPC coefficients for speech data (spec: A)
47  DECLARE_ALIGNED(32, float, gain_lpc)[FFALIGN(10, 16)]; ///< LPC coefficients for gain (spec: GB)
48 
49  /** speech data history (spec: SB).
50  * Its first 70 coefficients are updated only at backward filtering.
51  */
52  float sp_hist[111];
53 
54  /// speech part of the gain autocorrelation (spec: REXP)
55  float sp_rec[37];
56 
57  /** log-gain history (spec: SBLG).
58  * Its first 28 coefficients are updated only at backward filtering.
59  */
60  float gain_hist[38];
61 
62  /// recursive part of the gain autocorrelation (spec: REXPLG)
63  float gain_rec[11];
64 } RA288Context;
65 
67 {
68  RA288Context *ractx = avctx->priv_data;
69  AVFloatDSPContext *fdsp;
70 
74 
75  if (avctx->block_align != 38) {
76  av_log(avctx, AV_LOG_ERROR, "unsupported block align\n");
77  return AVERROR_PATCHWELCOME;
78  }
79 
81  if (!fdsp)
82  return AVERROR(ENOMEM);
83  ractx->vector_fmul = fdsp->vector_fmul;
84  av_free(fdsp);
85 
86  return 0;
87 }
88 
/**
 * Compute the scalar products of a signal with delayed copies of itself.
 *
 * For every lag k in [0, n], tgt[k] receives the scalar product of
 * src[0 .. len-1] with src[-k .. len-1-k]. The caller must therefore
 * guarantee that at least n valid samples precede src.
 *
 * @param tgt output array of n + 1 elements
 * @param src pointer into the signal, with n samples of history before it
 * @param len number of samples in each scalar product
 * @param n   largest lag to compute
 */
static void convolve(float *tgt, const float *src, int len, int n)
{
    for (; n >= 0; n--)
        tgt[n] = avpriv_scalarproduct_float_c(src, src - n, len);
}
95 
96 static void decode(RA288Context *ractx, float gain, int cb_coef)
97 {
98  int i;
99  double sumsum;
100  float sum, buffer[5];
101  float *block = ractx->sp_hist + 70 + 36; // current block
102  float *gain_block = ractx->gain_hist + 28;
103 
104  memmove(ractx->sp_hist + 70, ractx->sp_hist + 75, 36*sizeof(*block));
105 
106  /* block 46 of G.728 spec */
107  sum = 32.0;
108  for (i=0; i < 10; i++)
109  sum -= gain_block[9-i] * ractx->gain_lpc[i];
110 
111  /* block 47 of G.728 spec */
112  sum = av_clipf(sum, 0, 60);
113 
114  /* block 48 of G.728 spec */
115  /* exp(sum * 0.1151292546497) == pow(10.0,sum/20) */
116  sumsum = exp(sum * 0.1151292546497) * gain * (1.0/(1<<23));
117 
118  for (i=0; i < 5; i++)
119  buffer[i] = codetable[cb_coef][i] * sumsum;
120 
122 
123  sum = FFMAX(sum, 5.0 / (1<<24));
124 
125  /* shift and store */
126  memmove(gain_block, gain_block + 1, 9 * sizeof(*gain_block));
127 
128  gain_block[9] = 10 * log10(sum) + (10*log10(((1<<24)/5.)) - 32);
129 
131 }
132 
133 /**
134  * Hybrid window filtering, see blocks 36 and 49 of the G.728 specification.
135  *
136  * @param order filter order
137  * @param n input length
138  * @param non_rec number of non-recursive samples
139  * @param out filter output
140  * @param hist pointer to the input history of the filter
141  * @param out pointer to the non-recursive part of the output
142  * @param out2 pointer to the recursive part of the output
143  * @param window pointer to the windowing function table
144  */
145 static void do_hybrid_window(RA288Context *ractx,
146  int order, int n, int non_rec, float *out,
147  float *hist, float *out2, const float *window)
148 {
149  int i;
150  float buffer1[MAX_BACKWARD_FILTER_ORDER + 1];
151  float buffer2[MAX_BACKWARD_FILTER_ORDER + 1];
155 
156  av_assert2(order>=0);
157 
158  ractx->vector_fmul(work, window, hist, FFALIGN(order + n + non_rec, 16));
159 
160  convolve(buffer1, work + order , n , order);
161  convolve(buffer2, work + order + n, non_rec, order);
162 
163  for (i=0; i <= order; i++) {
164  out2[i] = out2[i] * 0.5625 + buffer1[i];
165  out [i] = out2[i] + buffer2[i];
166  }
167 
168  /* Multiply by the white noise correcting factor (WNCF). */
169  *out *= 257.0 / 256.0;
170 }
171 
172 /**
173  * Backward synthesis filter, find the LPC coefficients from past speech data.
174  */
175 static void backward_filter(RA288Context *ractx,
176  float *hist, float *rec, const float *window,
177  float *lpc, const float *tab,
178  int order, int n, int non_rec, int move_size)
179 {
181 
182  do_hybrid_window(ractx, order, n, non_rec, temp, hist, rec, window);
183 
184  if (!compute_lpc_coefs(temp, order, lpc, 0, 1, 1))
185  ractx->vector_fmul(lpc, lpc, tab, FFALIGN(order, 16));
186 
187  memmove(hist, hist + n, move_size*sizeof(*hist));
188 }
189 
191  int *got_frame_ptr, AVPacket *avpkt)
192 {
193  const uint8_t *buf = avpkt->data;
194  int buf_size = avpkt->size;
195  float *out;
196  int i, ret;
197  RA288Context *ractx = avctx->priv_data;
198  GetBitContext gb;
199 
200  if (buf_size < avctx->block_align) {
201  av_log(avctx, AV_LOG_ERROR,
202  "Error! Input buffer is too small [%d<%d]\n",
203  buf_size, avctx->block_align);
204  return AVERROR_INVALIDDATA;
205  }
206 
207  ret = init_get_bits8(&gb, buf, avctx->block_align);
208  if (ret < 0)
209  return ret;
210 
211  /* get output buffer */
213  if ((ret = ff_get_buffer(avctx, frame, 0)) < 0)
214  return ret;
215  out = (float *)frame->data[0];
216 
217  for (i=0; i < RA288_BLOCKS_PER_FRAME; i++) {
218  float gain = amptable[get_bits(&gb, 3)];
219  int cb_coef = get_bits(&gb, 6 + (i&1));
220 
221  decode(ractx, gain, cb_coef);
222 
223  memcpy(out, &ractx->sp_hist[70 + 36], RA288_BLOCK_SIZE * sizeof(*out));
225 
226  if ((i & 7) == 3) {
227  backward_filter(ractx, ractx->sp_hist, ractx->sp_rec, syn_window,
228  ractx->sp_lpc, syn_bw_tab, 36, 40, 35, 70);
229 
230  backward_filter(ractx, ractx->gain_hist, ractx->gain_rec, gain_window,
231  ractx->gain_lpc, gain_bw_tab, 10, 8, 20, 28);
232  }
233  }
234 
235  *got_frame_ptr = 1;
236 
237  return avctx->block_align;
238 }
239 
241  .p.name = "real_288",
242  CODEC_LONG_NAME("RealAudio 2.0 (28.8K)"),
243  .p.type = AVMEDIA_TYPE_AUDIO,
244  .p.id = AV_CODEC_ID_RA_288,
245  .priv_data_size = sizeof(RA288Context),
248  .p.capabilities = AV_CODEC_CAP_DR1 | AV_CODEC_CAP_CHANNEL_CONF,
249 };
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
mem_internal.h
out
FILE * out
Definition: movenc.c:54
codetable
static const int16_t codetable[128][5]
Definition: ra288.h:34
src1
const pixel * src1
Definition: h264pred_template.c:421
ff_ra_288_decoder
const FFCodec ff_ra_288_decoder
Definition: ra288.c:240
AVFrame
This structure describes decoded (raw) audio or video data.
Definition: frame.h:340
compute_lpc_coefs
static int AAC_RENAME() compute_lpc_coefs(const LPC_TYPE *autoc, int max_order, LPC_TYPE *lpc, int lpc_stride, int fail, int normalize)
Levinson-Durbin recursion.
Definition: lpc.h:167
AVPacket::data
uint8_t * data
Definition: packet.h:491
MAX_BACKWARD_FILTER_NONREC
#define MAX_BACKWARD_FILTER_NONREC
Definition: ra288.c:38
FFCodec
Definition: codec_internal.h:127
backward_filter
static void backward_filter(RA288Context *ractx, float *hist, float *rec, const float *window, float *lpc, const float *tab, int order, int n, int non_rec, int move_size)
Backward synthesis filter, find the LPC coefficients from past speech data.
Definition: ra288.c:175
FFMAX
#define FFMAX(a, b)
Definition: macros.h:47
lpc.h
ff_celp_lp_synthesis_filterf
void ff_celp_lp_synthesis_filterf(float *out, const float *filter_coeffs, const float *in, int buffer_length, int filter_length)
LP synthesis filter.
Definition: celp_filters.c:85
AVFrame::data
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:361
get_bits
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:335
window
static SDL_Window * window
Definition: ffplay.c:360
FFCodec::p
AVCodec p
The public AVCodec.
Definition: codec_internal.h:131
AVCodecContext::ch_layout
AVChannelLayout ch_layout
Audio channel layout.
Definition: avcodec.h:2107
decode
static void decode(RA288Context *ractx, float gain, int cb_coef)
Definition: ra288.c:96
GetBitContext
Definition: get_bits.h:108
tab
static const struct twinvq_data tab
Definition: twinvq_data.h:10345
MAX_BACKWARD_FILTER_ORDER
#define MAX_BACKWARD_FILTER_ORDER
Definition: ra288.c:36
AVCodecContext::flags
int flags
AV_CODEC_FLAG_*.
Definition: avcodec.h:521
gain_window
static const float gain_window[FFALIGN(38, 16)]
Definition: ra288.h:123
syn_bw_tab
static const float syn_bw_tab[FFALIGN(36, 16)]
synthesis bandwidth broadening table
Definition: ra288.h:134
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
av_cold
#define av_cold
Definition: attributes.h:90
init_get_bits8
static int init_get_bits8(GetBitContext *s, const uint8_t *buffer, int byte_size)
Initialize GetBitContext.
Definition: get_bits.h:545
LOCAL_ALIGNED
#define LOCAL_ALIGNED(a, t, v,...)
Definition: mem_internal.h:112
FF_CODEC_DECODE_CB
#define FF_CODEC_DECODE_CB(func)
Definition: codec_internal.h:306
AVMEDIA_TYPE_AUDIO
@ AVMEDIA_TYPE_AUDIO
Definition: avutil.h:202
init
int(* init)(AVBSFContext *ctx)
Definition: dts2pts_bsf.c:365
do_hybrid_window
static void do_hybrid_window(RA288Context *ractx, int order, int n, int non_rec, float *out, float *hist, float *out2, const float *window)
Hybrid window filtering, see blocks 36 and 49 of the G.728 specification.
Definition: ra288.c:145
decode.h
get_bits.h
gain_bw_tab
static const float gain_bw_tab[FFALIGN(10, 16)]
gain bandwidth broadening table
Definition: ra288.h:144
CODEC_LONG_NAME
#define CODEC_LONG_NAME(str)
Definition: codec_internal.h:272
frame
static AVFrame * frame
Definition: demux_decode.c:54
AVERROR_PATCHWELCOME
#define AVERROR_PATCHWELCOME
Not yet implemented in FFmpeg, patches welcome.
Definition: error.h:64
work
must be printed separately If there s no standard function for printing the type you the WRITE_1D_FUNC_ARGV macro is a very quick way to create one See libavcodec dv_tablegen c for an example The h file This file should the initialization functions should not do and instead of the variable declarations the generated *_tables h file should be included Since that will be generated in the build the path must be i e not Makefile changes To make the automatic table creation work
Definition: tablegen.txt:66
RA288_BLOCKS_PER_FRAME
#define RA288_BLOCKS_PER_FRAME
Definition: ra288.c:41
RA288Context::sp_lpc
float sp_lpc[FFALIGN(36, 16)]
LPC coefficients for speech data (spec: A)
Definition: ra288.c:46
celp_filters.h
av_clipf
av_clipf
Definition: af_crystalizer.c:121
exp
int8_t exp
Definition: eval.c:72
ra288_decode_init
static av_cold int ra288_decode_init(AVCodecContext *avctx)
Definition: ra288.c:66
float_dsp.h
AV_CODEC_CAP_CHANNEL_CONF
#define AV_CODEC_CAP_CHANNEL_CONF
Codec should fill in channel configuration and samplerate instead of container.
Definition: codec.h:106
ff_get_buffer
int ff_get_buffer(AVCodecContext *avctx, AVFrame *frame, int flags)
Get a buffer for a frame.
Definition: decode.c:1617
AV_CODEC_CAP_DR1
#define AV_CODEC_CAP_DR1
Codec uses get_buffer() or get_encode_buffer() for allocating buffers and supports custom allocators.
Definition: codec.h:52
AVPacket::size
int size
Definition: packet.h:492
AVChannelLayout
An AVChannelLayout holds information about the channel layout of audio data.
Definition: channel_layout.h:307
codec_internal.h
DECLARE_ALIGNED
#define DECLARE_ALIGNED(n, t, v)
Definition: mem_internal.h:87
AVFloatDSPContext::vector_fmul
void(* vector_fmul)(float *dst, const float *src0, const float *src1, int len)
Calculate the entry wise product of two vectors of floats and store the result in a vector of floats.
Definition: float_dsp.h:38
for
for(k=2;k<=8;++k)
Definition: h264pred_template.c:425
AVCodecContext::sample_fmt
enum AVSampleFormat sample_fmt
audio sample format
Definition: avcodec.h:1080
AVFloatDSPContext
Definition: float_dsp.h:24
convolve
static void convolve(float *tgt, const float *src, int len, int n)
Definition: ra288.c:89
RA288Context
Definition: ra288.c:43
RA288_BLOCK_SIZE
#define RA288_BLOCK_SIZE
Definition: ra288.c:40
av_assert2
#define av_assert2(cond)
assert() equivalent, that does lie in speed critical code.
Definition: avassert.h:67
AV_CODEC_ID_RA_288
@ AV_CODEC_ID_RA_288
Definition: codec_id.h:428
AVFrame::nb_samples
int nb_samples
number of audio samples (per channel) described by this frame
Definition: frame.h:420
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:255
internal.h
ra288_decode_frame
static int ra288_decode_frame(AVCodecContext *avctx, AVFrame *frame, int *got_frame_ptr, AVPacket *avpkt)
Definition: ra288.c:190
AVCodec::name
const char * name
Name of the codec implementation.
Definition: codec.h:194
RA288Context::gain_lpc
float gain_lpc[FFALIGN(10, 16)]
LPC coefficients for gain (spec: GB)
Definition: ra288.c:47
len
int len
Definition: vorbis_enc_data.h:426
syn_window
static const float syn_window[FFALIGN(111, 16)]
Definition: ra288.h:101
RA288Context::gain_hist
float gain_hist[38]
log-gain history (spec: SBLG).
Definition: ra288.c:60
avcodec.h
RA288Context::vector_fmul
void(* vector_fmul)(float *dst, const float *src0, const float *src1, int len)
Definition: ra288.c:44
ret
ret
Definition: filter_design.txt:187
AVCodecContext::block_align
int block_align
number of bytes per packet if constant and known or 0 Used by some WAV based audio codecs.
Definition: avcodec.h:1113
RA288Context::sp_rec
float sp_rec[37]
speech part of the gain autocorrelation (spec: REXP)
Definition: ra288.c:55
RA288Context::gain_rec
float gain_rec[11]
recursive part of the gain autocorrelation (spec: REXPLG)
Definition: ra288.c:63
AVCodecContext
main external API structure.
Definition: avcodec.h:441
channel_layout.h
buffer
the frame and frame reference mechanism is intended to as much as expensive copies of that data while still allowing the filters to produce correct results The data is stored in buffers represented by AVFrame structures Several references can point to the same frame buffer
Definition: filter_design.txt:49
av_channel_layout_uninit
void av_channel_layout_uninit(AVChannelLayout *channel_layout)
Free any allocated data in the channel layout and reset the channel count to 0.
Definition: channel_layout.c:640
temp
else temp
Definition: vf_mcdeint.c:263
avpriv_scalarproduct_float_c
float avpriv_scalarproduct_float_c(const float *v1, const float *v2, int len)
Return the scalar product of two vectors.
Definition: float_dsp.c:124
src0
const pixel *const src0
Definition: h264pred_template.c:420
AV_CODEC_FLAG_BITEXACT
#define AV_CODEC_FLAG_BITEXACT
Use only bitexact stuff (except (I)DCT).
Definition: avcodec.h:338
AV_CHANNEL_LAYOUT_MONO
#define AV_CHANNEL_LAYOUT_MONO
Definition: channel_layout.h:382
amptable
static const float amptable[8]
Definition: ra288.h:29
av_free
#define av_free(p)
Definition: tableprint_vlc.h:33
FFALIGN
#define FFALIGN(x, a)
Definition: macros.h:78
AVPacket
This structure stores compressed data.
Definition: packet.h:468
AVCodecContext::priv_data
void * priv_data
Definition: avcodec.h:468
src
INIT_CLIP pixel * src
Definition: h264pred_template.c:418
avpriv_float_dsp_alloc
av_cold AVFloatDSPContext * avpriv_float_dsp_alloc(int bit_exact)
Allocate a float DSP context.
Definition: float_dsp.c:135
block
The exact code depends on how similar the blocks are and how related they are to the block
Definition: filter_design.txt:207
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
RA288Context::sp_hist
float sp_hist[111]
speech data history (spec: SB).
Definition: ra288.c:52
MAX_BACKWARD_FILTER_LEN
#define MAX_BACKWARD_FILTER_LEN
Definition: ra288.c:37
ra288.h
AV_SAMPLE_FMT_FLT
@ AV_SAMPLE_FMT_FLT
float
Definition: samplefmt.h:60