00001
00002
00003
00004
00005
00006
00007
00008
00009
00010
00011
00012
00013
00014
00015
00016
00017
00018
00019
00020
00021
00022 #ifndef AVCODEC_PSYMODEL_H
00023 #define AVCODEC_PSYMODEL_H
00024
00025 #include "avcodec.h"
00026
/** Upper bound on the number of bands; sizes the per-band arrays declared in this header. */
#define PSY_MAX_BANDS 128
00029
/** Upper bound on the number of channels; sizes the channel pointer array of a channel group. */
#define PSY_MAX_CHANS 20
00031
/**
 * Psychoacoustic data for a single band.
 *
 * NOTE(review): this header only declares the fields. The per-field notes
 * are read off the field names; confirm exact semantics and units against
 * the model implementations.
 */
typedef struct FFPsyBand {
    int   bits;              /**< bit count associated with the band */
    float energy;            /**< band energy */
    float threshold;         /**< band threshold (presumably the masking threshold -- confirm) */
    float distortion;        /**< band distortion */
    float perceptual_weight; /**< perceptual weight of the band */
} FFPsyBand;
00042
00046 typedef struct FFPsyChannel {
00047 FFPsyBand psy_bands[PSY_MAX_BANDS];
00048 float entropy;
00049 } FFPsyChannel;
00050
00054 typedef struct FFPsyChannelGroup {
00055 FFPsyChannel *ch[PSY_MAX_CHANS];
00056 uint8_t num_ch;
00057 uint8_t coupling[PSY_MAX_BANDS];
00058 } FFPsyChannelGroup;
00059
/**
 * Windowing information, as returned by value from FFPsyModel::window and
 * passed to FFPsyModel::analyze.
 *
 * NOTE(review): the encoding of the type/shape values and the ownership of
 * window_sizes are not visible in this header; confirm against the users.
 */
typedef struct FFPsyWindowInfo {
    int  window_type[3]; /**< three window type values (which slot is
                              current/previous/next is not shown here) */
    int  window_shape;   /**< window shape */
    int  num_windows;    /**< number of windows */
    int  grouping[8];    /**< window grouping, eight entries */
    int *window_sizes;   /**< pointer to window sizes */
} FFPsyWindowInfo;
00070
00074 typedef struct FFPsyContext {
00075 AVCodecContext *avctx;
00076 const struct FFPsyModel *model;
00077
00078 FFPsyChannel *ch;
00079 FFPsyChannelGroup *group;
00080 int num_groups;
00081
00082 uint8_t **bands;
00083 int *num_bands;
00084 int num_lens;
00085
00086 struct {
00087 int size;
00088 int bits;
00089 } bitres;
00090
00091 void* model_priv_data;
00092 } FFPsyContext;
00093
00097 typedef struct FFPsyModel {
00098 const char *name;
00099 int (*init) (FFPsyContext *apc);
00100
00112 FFPsyWindowInfo (*window)(FFPsyContext *ctx, const float *audio, const float *la, int channel, int prev_type);
00113
00122 void (*analyze)(FFPsyContext *ctx, int channel, const float **coeffs, const FFPsyWindowInfo *wi);
00123
00124 void (*end) (FFPsyContext *apc);
00125 } FFPsyModel;
00126
00140 av_cold int ff_psy_init(FFPsyContext *ctx, AVCodecContext *avctx, int num_lens,
00141 const uint8_t **bands, const int* num_bands,
00142 int num_groups, const uint8_t *group_map);
00143
00152 FFPsyChannelGroup *ff_psy_find_group(FFPsyContext *ctx, int channel);
00153
00159 av_cold void ff_psy_end(FFPsyContext *ctx);
00160
00161
00162
00163
00164
00165
/**
 * Opaque preprocessing context; only pointers to it are used in this header.
 */
struct FFPsyPreprocessContext;
00167
00171 av_cold struct FFPsyPreprocessContext* ff_psy_preprocess_init(AVCodecContext *avctx);
00172
/**
 * Run the preprocessing step on audio data.
 *
 * @param ctx      preprocessing context
 * @param audio    array of sample buffer pointers; the buffers are not
 *                 const, so presumably they are modified in place -- confirm
 * @param channels channel count (presumably the number of entries in audio)
 */
void ff_psy_preprocess(struct FFPsyPreprocessContext *ctx, float **audio, int channels);
00181
00185 av_cold void ff_psy_preprocess_end(struct FFPsyPreprocessContext *ctx);
00186
00187 #endif