doxygen/4.1/vp3dsp_8c_source.html

 /*

  * Copyright (C) 2004 The FFmpeg project

  *

  * This file is part of FFmpeg.

  *

  * FFmpeg is free software; you can redistribute it and/or

  * modify it under the terms of the GNU Lesser General Public

  * License as published by the Free Software Foundation; either

  * version 2.1 of the License, or (at your option) any later version.

  *

  * FFmpeg is distributed in the hope that it will be useful,

  * but WITHOUT ANY WARRANTY; without even the implied warranty of

  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU

  * Lesser General Public License for more details.

  *

  * You should have received a copy of the GNU Lesser General Public

  * License along with FFmpeg; if not, write to the Free Software

  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA

  */


 /**

  * @file

  * Standard C DSP-oriented functions cribbed from the original VP3

  * source code.

  */


 #include "libavutil/attributes.h"

 #include "libavutil/common.h"

 #include "libavutil/intreadwrite.h"


 #include "avcodec.h"

 #include "rnd_avg.h"

 #include "vp3dsp.h"


 /* Rounding term of the DC-only shortcut in idct(): it is shifted left by 16
  * and added before a right shift by 20, i.e. it contributes one half of the
  * final ">> 4" step. */
 #define IdctAdjustBeforeShift 8
 /* Cosine table in 16.16 fixed point:
  * xC<k>S<8-k> == round(65536 * cos(k * pi / 16)) == round(65536 * sin((8 - k) * pi / 16)). */
 #define xC1S7 64277
 #define xC2S6 60547
 #define xC3S5 54491
 #define xC4S4 46341
 #define xC5S3 36410
 #define xC6S2 25080
 #define xC7S1 12785

 /* Fixed-point multiply: form a * b in SUINT, convert the product to int and
  * drop the 16 fractional bits (the cast binds tighter than the shift).
  * NOTE(review): SUINT is defined outside this file; presumably an unsigned
  * type so the multiplication cannot overflow as a signed int -- confirm. */
 #define M(a, b) ((int)((SUINT)(a) * (b)) >> 16)


 /**
  * 8x8 inverse DCT shared by vp3_idct_put_c() and vp3_idct_add_c().
  *
  * The transform runs as two passes of eight 1-D butterflies each:
  *  - pass 1 reads the coefficients input[n + 0 * 8] .. input[n + 7 * 8]
  *    (n = 0..7) and overwrites them in place with the unrounded result,
  *    stored back as int16_t;
  *  - pass 2 reads eight consecutive coefficients input[8 * n + 0..7], adds
  *    the rounding term 8, shifts right by 4, and writes the eight results
  *    to dst[n + 0 * stride] .. dst[n + 7 * stride], i.e. one vertical line
  *    of output pixels per iteration.
  *
  * @param dst    top-left output pixel
  * @param stride offset between vertically adjacent output pixels
  * @param input  64 coefficients; modified by pass 1 and not restored
  * @param type   1: store the result with a bias of 128 (overwrites dst);
  *               any other value: add the result to the pixels in dst
  */
 static av_always_inline void idct(uint8_t *dst, ptrdiff_t stride,
                                   int16_t *input, int type)
 {
     int16_t *ip = input;

     int A, B, C, D, Ad, Bd, Cd, Dd, E, F, G, H;
     int Ed, Gd, Add, Bdd, Fd, Hd;

     int i;

     /* Pass 1: 1-D inverse DCT over the coefficients spaced 8 apart. */
     for (i = 0; i < 8; i++) {
         /* All-zero inputs give all-zero outputs, so the eight (already
          * zero) values can be left untouched. */
         if (ip[0 * 8] | ip[1 * 8] | ip[2 * 8] | ip[3 * 8] |
             ip[4 * 8] | ip[5 * 8] | ip[6 * 8] | ip[7 * 8]) {
             /* Odd-indexed coefficients. */
             A = M(xC1S7, ip[1 * 8]) + M(xC7S1, ip[7 * 8]);
             B = M(xC7S1, ip[1 * 8]) - M(xC1S7, ip[7 * 8]);
             C = M(xC3S5, ip[3 * 8]) + M(xC5S3, ip[5 * 8]);
             D = M(xC3S5, ip[5 * 8]) - M(xC5S3, ip[3 * 8]);

             Ad = M(xC4S4, (A - C));
             Bd = M(xC4S4, (B - D));

             Cd = A + C;
             Dd = B + D;

             /* Even-indexed coefficients. */
             E = M(xC4S4, (ip[0 * 8] + ip[4 * 8]));
             F = M(xC4S4, (ip[0 * 8] - ip[4 * 8]));

             G = M(xC2S6, ip[2 * 8]) + M(xC6S2, ip[6 * 8]);
             H = M(xC6S2, ip[2 * 8]) - M(xC2S6, ip[6 * 8]);

             Ed = E - G;
             Gd = E + G;

             Add = F + Ad;
             Bdd = Bd - H;

             Fd = F - Ad;
             Hd = Bd + H;

             /* Store the results over the inputs; every input has been
              * consumed above, so the in-place write is safe. The int
              * results are converted to int16_t on assignment. */
             ip[0 * 8] = Gd + Cd;
             ip[7 * 8] = Gd - Cd;

             ip[1 * 8] = Add + Hd;
             ip[2 * 8] = Add - Hd;

             ip[3 * 8] = Ed + Dd;
             ip[4 * 8] = Ed - Dd;

             ip[5 * 8] = Fd + Bdd;
             ip[6 * 8] = Fd - Bdd;
         }

         ip += 1;            /* next set of coefficients spaced 8 apart */
     }

     ip = input;

     /* Pass 2: 1-D inverse DCT over each run of 8 consecutive coefficients,
      * with rounding, shift and output to dst. */
     for (i = 0; i < 8; i++) {
         /* ip[0] is deliberately left out of the test: when only it can be
          * non-zero the cheaper constant-value branch below is used. */
         if (ip[1] | ip[2] | ip[3] |
             ip[4] | ip[5] | ip[6] | ip[7]) {
             A = M(xC1S7, ip[1]) + M(xC7S1, ip[7]);
             B = M(xC7S1, ip[1]) - M(xC1S7, ip[7]);
             C = M(xC3S5, ip[3]) + M(xC5S3, ip[5]);
             D = M(xC3S5, ip[5]) - M(xC5S3, ip[3]);

             Ad = M(xC4S4, (A - C));
             Bd = M(xC4S4, (B - D));

             Cd = A + C;
             Dd = B + D;

             /* + 8 rounds the ">> 4" applied to every output below; E and F
              * feed all eight outputs, so adding it here covers them all. */
             E = M(xC4S4, (ip[0] + ip[4])) + 8;
             F = M(xC4S4, (ip[0] - ip[4])) + 8;

             /* 16 * 128 before the ">> 4" is a bias of 128 on each stored
              * pixel. */
             if (type == 1) { // HACK
                 E += 16 * 128;
                 F += 16 * 128;
             }

             G = M(xC2S6, ip[2]) + M(xC6S2, ip[6]);
             H = M(xC6S2, ip[2]) - M(xC2S6, ip[6]);

             Ed = E - G;
             Gd = E + G;

             Add = F + Ad;
             Bdd = Bd - H;

             Fd = F - Ad;
             Hd = Bd + H;

             /* Write one vertical line of eight pixels: stored directly for
              * type 1, otherwise added to the existing pixels. Either way
              * the value is clipped to 0..255. */
             if (type == 1) {
                 dst[0 * stride] = av_clip_uint8((Gd + Cd) >> 4);
                 dst[7 * stride] = av_clip_uint8((Gd - Cd) >> 4);

                 dst[1 * stride] = av_clip_uint8((Add + Hd) >> 4);
                 dst[2 * stride] = av_clip_uint8((Add - Hd) >> 4);

                 dst[3 * stride] = av_clip_uint8((Ed + Dd) >> 4);
                 dst[4 * stride] = av_clip_uint8((Ed - Dd) >> 4);

                 dst[5 * stride] = av_clip_uint8((Fd + Bdd) >> 4);
                 dst[6 * stride] = av_clip_uint8((Fd - Bdd) >> 4);
             } else {
                 dst[0 * stride] = av_clip_uint8(dst[0 * stride] + ((Gd + Cd) >> 4));
                 dst[7 * stride] = av_clip_uint8(dst[7 * stride] + ((Gd - Cd) >> 4));

                 dst[1 * stride] = av_clip_uint8(dst[1 * stride] + ((Add + Hd) >> 4));
                 dst[2 * stride] = av_clip_uint8(dst[2 * stride] + ((Add - Hd) >> 4));

                 dst[3 * stride] = av_clip_uint8(dst[3 * stride] + ((Ed + Dd) >> 4));
                 dst[4 * stride] = av_clip_uint8(dst[4 * stride] + ((Ed - Dd) >> 4));

                 dst[5 * stride] = av_clip_uint8(dst[5 * stride] + ((Fd + Bdd) >> 4));
                 dst[6 * stride] = av_clip_uint8(dst[6 * stride] + ((Fd - Bdd) >> 4));
             }
         } else {
             /* Only ip[0] can be non-zero: all eight outputs share one
              * value, (xC4S4 * ip[0] + rounding) >> 20, which folds the
              * ">> 16" of M() and the final ">> 4" into a single shift. */
             if (type == 1) {
                 dst[0*stride] =
                 dst[1*stride] =
                 dst[2*stride] =
                 dst[3*stride] =
                 dst[4*stride] =
                 dst[5*stride] =
                 dst[6*stride] =
                 dst[7*stride] = av_clip_uint8(128 + ((xC4S4 * ip[0] + (IdctAdjustBeforeShift << 16)) >> 20));
             } else {
                 /* With ip[0] == 0 the value to add is 0, so there is
                  * nothing to do. */
                 if (ip[0]) {
                     int v = (xC4S4 * ip[0] + (IdctAdjustBeforeShift << 16)) >> 20;
                     dst[0 * stride] = av_clip_uint8(dst[0 * stride] + v);
                     dst[1 * stride] = av_clip_uint8(dst[1 * stride] + v);
                     dst[2 * stride] = av_clip_uint8(dst[2 * stride] + v);
                     dst[3 * stride] = av_clip_uint8(dst[3 * stride] + v);
                     dst[4 * stride] = av_clip_uint8(dst[4 * stride] + v);
                     dst[5 * stride] = av_clip_uint8(dst[5 * stride] + v);
                     dst[6 * stride] = av_clip_uint8(dst[6 * stride] + v);
                     dst[7 * stride] = av_clip_uint8(dst[7 * stride] + v);
                 }
             }
         }

         ip += 8;            /* next run of 8 consecutive coefficients */
         dst++;              /* next vertical line of output pixels */
     }
 }


 /**
  * Inverse-transform an 8x8 coefficient block and store the resulting
  * pixels into dest, then clear all 64 coefficients of block.
  *
  * @param dest   top-left pixel of the 8x8 destination area
  * @param stride offset between vertically adjacent destination pixels
  * @param block  64 coefficients; zeroed on return
  */
 static void vp3_idct_put_c(uint8_t *dest /* align 8 */, ptrdiff_t stride,
                            int16_t *block /* align 16 */)
 {
     /* type 1 selects the "store" variant of idct() */
     idct(dest, stride, block, 1);

     memset(block, 0, 64 * sizeof(block[0]));
 }


 /**
  * Inverse-transform an 8x8 coefficient block and add the result to the
  * pixels already in dest, then clear all 64 coefficients of block.
  *
  * @param dest   top-left pixel of the 8x8 destination area
  * @param stride offset between vertically adjacent destination pixels
  * @param block  64 coefficients; zeroed on return
  */
 static void vp3_idct_add_c(uint8_t *dest /* align 8 */, ptrdiff_t stride,
                            int16_t *block /* align 16 */)
 {
     /* any type other than 1 selects the "add" variant of idct() */
     idct(dest, stride, block, 2);

     memset(block, 0, 64 * sizeof(block[0]));
 }


 /**
  * DC-only variant of the add transform: derive one offset from block[0],
  * add it to every pixel of the 8x8 area at dest (clipping to 0..255) and
  * reset block[0] to zero.
  *
  * @param dest   top-left pixel of the 8x8 destination area
  * @param stride offset between vertically adjacent destination pixels
  * @param block  coefficient block; only block[0] is read and cleared
  */
 static void vp3_idct_dc_add_c(uint8_t *dest /* align 8 */, ptrdiff_t stride,
                               int16_t *block /* align 16 */)
 {
     /* rounded DC contribution shared by all 64 pixels */
     const int dc = (block[0] + 15) >> 5;
     int x, y;

     for (y = 0; y < 8; y++) {
         uint8_t *row = dest + y * stride;

         for (x = 0; x < 8; x++)
             row[x] = av_clip_uint8(row[x] + dc);
     }

     block[0] = 0;
 }


 /**
  * Filter 8 horizontally adjacent positions across the edge between the row
  * at first_pixel and the row directly above it.
  *
  * For each position a difference is computed from the two pixels on either
  * side of the edge, mapped through bounding_values, then added to the pixel
  * above the edge and subtracted from the pixel below it.
  *
  * @param first_pixel     leftmost pixel of the row just below the edge
  * @param stride          offset between vertically adjacent pixels
  * @param bounding_values lookup table; the index may be negative, so this
  *                        must point into the interior of the table
  */
 static void vp3_v_loop_filter_c(uint8_t *first_pixel, ptrdiff_t stride,
                                 int *bounding_values)
 {
     int x;

     for (x = 0; x < 8; x++) {
         uint8_t *below = first_pixel + x;   /* first pixel under the edge */
         uint8_t *above = below - stride;    /* first pixel over the edge  */
         const int delta = (above[-stride] - below[stride]) +
                           (below[0] - above[0]) * 3;
         const int adj   = bounding_values[(delta + 4) >> 3];

         above[0] = av_clip_uint8(above[0] + adj);
         below[0] = av_clip_uint8(below[0] - adj);
     }
 }


 /**
  * Filter 8 vertically adjacent positions across the edge between the column
  * at first_pixel and the column directly to its left.
  *
  * For each row a difference is computed from the two pixels on either side
  * of the edge, mapped through bounding_values, then added to the pixel left
  * of the edge and subtracted from the pixel right of it.
  *
  * @param first_pixel     topmost pixel of the column just right of the edge
  * @param stride          offset between vertically adjacent pixels
  * @param bounding_values lookup table; the index may be negative, so this
  *                        must point into the interior of the table
  */
 static void vp3_h_loop_filter_c(uint8_t *first_pixel, ptrdiff_t stride,
                                 int *bounding_values)
 {
     /* Compared with != rather than <, so the loop also terminates
      * correctly when stride is negative. */
     uint8_t *const last = first_pixel + 8 * stride;

     while (first_pixel != last) {
         const int delta = (first_pixel[-2] - first_pixel[1]) +
                           (first_pixel[ 0] - first_pixel[-1]) * 3;
         const int adj   = bounding_values[(delta + 4) >> 3];

         first_pixel[-1] = av_clip_uint8(first_pixel[-1] + adj);
         first_pixel[ 0] = av_clip_uint8(first_pixel[ 0] - adj);

         first_pixel += stride;
     }
 }


 /**
  * Combine two 8-pixel-wide sources into dst, row by row, using
  * no_rnd_avg32() on 4 bytes at a time.
  *
  * The sources are read with AV_RN32 and the destination is written with
  * AV_WN32A. All three buffers share the same stride.
  * NOTE(review): no_rnd_avg32() is defined in rnd_avg.h; presumably a
  * per-byte average without upward rounding -- confirm there.
  *
  * @param dst    destination, 8 bytes written per row
  * @param src1   first source, 8 bytes read per row
  * @param src2   second source, 8 bytes read per row
  * @param stride offset between consecutive rows in all three buffers
  * @param h      number of rows to process
  */
 static void put_no_rnd_pixels_l2(uint8_t *dst, const uint8_t *src1,
                                  const uint8_t *src2, ptrdiff_t stride, int h)
 {
     int row;

     for (row = 0; row < h; row++) {
         const ptrdiff_t off = row * stride;
         const uint8_t  *p1  = src1 + off;
         const uint8_t  *p2  = src2 + off;
         uint8_t        *out = dst  + off;
         uint32_t lo, hi;

         /* left 4 pixels are read and stored before the right 4 are read */
         lo = no_rnd_avg32(AV_RN32(p1), AV_RN32(p2));
         AV_WN32A(out, lo);

         hi = no_rnd_avg32(AV_RN32(p1 + 4), AV_RN32(p2 + 4));
         AV_WN32A(out + 4, hi);
     }
 }


 /**
  * Fill a VP3DSPContext with the C implementations from this file, then
  * call the per-architecture init function for each enabled architecture.
  *
  * @param c     context whose function pointers are set
  * @param flags passed through unchanged to the per-architecture inits
  */
 av_cold void ff_vp3dsp_init(VP3DSPContext *c, int flags)
 {
     /* inverse transforms */
     c->idct_put      = vp3_idct_put_c;
     c->idct_add      = vp3_idct_add_c;
     c->idct_dc_add   = vp3_idct_dc_add_c;

     /* loop filters */
     c->v_loop_filter = vp3_v_loop_filter_c;
     c->h_loop_filter = vp3_h_loop_filter_c;

     /* two-source pixel averaging */
     c->put_no_rnd_pixels_l2 = put_no_rnd_pixels_l2;

     /* NOTE(review): the ARCH_* constants and the functions below are
      * defined outside this file; presumably they replace some of the
      * pointers set above with optimized versions -- confirm. */
     if (ARCH_ARM) {
         ff_vp3dsp_init_arm(c, flags);
     }
     if (ARCH_PPC) {
         ff_vp3dsp_init_ppc(c, flags);
     }
     if (ARCH_X86) {
         ff_vp3dsp_init_x86(c, flags);
     }
 }

VP3DSPContext::put_no_rnd_pixels_l2
void(* put_no_rnd_pixels_l2)(uint8_t *dst, const uint8_t *a, const uint8_t *b, ptrdiff_t stride, int h)
Copy 8xH pixels from source to destination buffer using a bilinear filter with no rounding (i...
Definition: vp3dsp.h:36

vp3_idct_put_c
static void vp3_idct_put_c(uint8_t *dest, ptrdiff_t stride, int16_t *block)
Definition: vp3dsp.c:197

h
h
Definition: vp9dsp_template.c:2038

vp3dsp.h

C
#define C

b
const char * b
Definition: vf_curves.c:116

xC4S4
#define xC4S4
Definition: vp3dsp.c:39

VP3DSPContext::v_loop_filter
void(* v_loop_filter)(uint8_t *src, ptrdiff_t stride, int *bounding_values)
Definition: vp3dsp.h:44

put_no_rnd_pixels_l2
static void put_no_rnd_pixels_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, ptrdiff_t stride, int h)
Definition: vp3dsp.c:263

AV_WN32A
#define AV_WN32A(p, v)
Definition: intreadwrite.h:538

attributes.h
Macro definitions for various function/variable attributes.

block
static int16_t block[64]
Definition: dct.c:115

xC1S7
#define xC1S7
Definition: vp3dsp.c:36

M
#define M(a, b)
Definition: vp3dsp.c:44

uint8_t
uint8_t
Definition: audio_convert.c:194

av_cold
#define av_cold
Definition: attributes.h:82

end
static av_cold int end(AVCodecContext *avctx)
Definition: avrndec.c:90

VP3DSPContext
Definition: vp3dsp.h:25

A
#define A(x)
Definition: vp56_arith.h:28

vp3_idct_add_c
static void vp3_idct_add_c(uint8_t *dest, ptrdiff_t stride, int16_t *block)
Definition: vp3dsp.c:204

xC6S2
#define xC6S2
Definition: vp3dsp.c:41

vp3_v_loop_filter_c
static void vp3_v_loop_filter_c(uint8_t *first_pixel, ptrdiff_t stride, int *bounding_values)
Definition: vp3dsp.c:230

B
#define B
Definition: huffyuvdsp.h:32

xC2S6
#define xC2S6
Definition: vp3dsp.c:37

xC7S1
#define xC7S1
Definition: vp3dsp.c:42

VP3DSPContext::h_loop_filter
void(* h_loop_filter)(uint8_t *src, ptrdiff_t stride, int *bounding_values)
Definition: vp3dsp.h:45

VP3DSPContext::idct_dc_add
void(* idct_dc_add)(uint8_t *dest, ptrdiff_t stride, int16_t *block)
Definition: vp3dsp.h:43

no_rnd_avg32
static uint32_t no_rnd_avg32(uint32_t a, uint32_t b)
Definition: rnd_avg.h:36

E
#define E
Definition: avdct.c:32

filter_value
static int filter_value(int in, int rrp[8], int v[9])
Definition: gsmdec_template.c:72

vp3_h_loop_filter_c
static void vp3_h_loop_filter_c(uint8_t *first_pixel, ptrdiff_t stride, int *bounding_values)
Definition: vp3dsp.c:247

intreadwrite.h

src1
#define src1
Definition: h264pred.c:139

avcodec.h
Libavcodec external API header.

ff_vp3dsp_init_arm
av_cold void ff_vp3dsp_init_arm(VP3DSPContext *c, int flags)
Definition: vp3dsp_init_arm.c:33

type
GLint GLenum type
Definition: opengl_enc.c:105

vp3_idct_dc_add_c
static void vp3_idct_dc_add_c(uint8_t *dest, ptrdiff_t stride, int16_t *block)
Definition: vp3dsp.c:211

ff_vp3dsp_init_x86
void ff_vp3dsp_init_x86(VP3DSPContext *c, int flags)
Definition: vp3dsp_init.c:46

AV_RN32
#define AV_RN32(p)
Definition: intreadwrite.h:364

VP3DSPContext::idct_put
void(* idct_put)(uint8_t *dest, ptrdiff_t stride, int16_t *block)
Definition: vp3dsp.h:41

flags
#define flags(name, subs,...)
Definition: cbs_av1.c:596

VP3DSPContext::idct_add
void(* idct_add)(uint8_t *dest, ptrdiff_t stride, int16_t *block)
Definition: vp3dsp.h:42

xC3S5
#define xC3S5
Definition: vp3dsp.c:38

rnd_avg.h

stride
GLint GLenum GLboolean GLsizei stride
Definition: opengl_enc.c:105

common.h
common internal and external API header

G
#define G
Definition: huffyuvdsp.h:33

D
D(D(float, sse)
Definition: rematrix_init.c:28

c
static double c[64]
Definition: vsrc_mptestsrc.c:87

ff_vp3dsp_init_ppc
av_cold void ff_vp3dsp_init_ppc(VP3DSPContext *c, int flags)
Definition: vp3dsp_altivec.c:195

idct
static av_always_inline void idct(uint8_t *dst, ptrdiff_t stride, int16_t *input, int type)
Definition: vp3dsp.c:46

F
#define F(x)

H
#define H
Definition: pixlet.c:39

dc
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(constuint8_t *) pi-0x80)*(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(constint16_t *) pi >>8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t,*(constint16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(constint32_t *) pi >>24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t,*(constint32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(constfloat *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(constfloat *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(constfloat *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(constdouble *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(constdouble *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(constdouble *) pi *(1U<< 31))))#defineSET_CONV_FUNC_GROUP(ofmt, ifmt) staticvoidset_generic_function(AudioConvert *ac){}voidff_audio_convert_free(AudioConvert **ac){if(!*ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);}AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enumAVSampleFormatout_fmt, enumAVSampleFormatin_fmt, intchannels, intsample_rate, 
intapply_map){AudioConvert *ac;intin_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) returnNULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method!=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt)>2){ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc){av_free(ac);returnNULL;}returnac;}in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar){ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar?ac->channels:1;}elseif(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;elseac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);returnac;}intff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in){intuse_generic=1;intlen=in->nb_samples;intp;if(ac->dc){av_log(ac->avr, AV_LOG_TRACE,"%dsamples-audio_convert:%sto%s(dithered)\n", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));returnff_convert_dither(ac-> dc
Definition: audio_convert.c:194

av_always_inline
#define av_always_inline
Definition: attributes.h:39

IdctAdjustBeforeShift
#define IdctAdjustBeforeShift
Definition: vp3dsp.c:35

stride
#define stride

ff_vp3dsp_init
av_cold void ff_vp3dsp_init(VP3DSPContext *c, int flags)
Definition: vp3dsp.c:280

xC5S3
#define xC5S3
Definition: vp3dsp.c:40

a
a
Definition: h264pred_template.c:468