libpostproc/postprocess_template.c File Reference

mmx/mmx2/3dnow postprocess code. More...

#include "libavutil/x86_cpu.h"

Go to the source code of this file.

Defines

#define REAL_PAVGB(a, b)   "pavgusb " #a ", " #b " \n\t"
#define PAVGB(a, b)   REAL_PAVGB(a,b)
#define PMINUB(b, a, t)
#define PMAXUB(a, b)
#define REAL_FIND_MIN_MAX(addr)
#define FIND_MIN_MAX(addr)   REAL_FIND_MIN_MAX(addr)
#define REAL_DERING_CORE(dst, src, ppsx, psx, sx, pplx, plx, lx, t0, t1)
#define DERING_CORE(dst, src, ppsx, psx, sx, pplx, plx, lx, t0, t1)   REAL_DERING_CORE(dst,src,ppsx,psx,sx,pplx,plx,lx,t0,t1)
#define REAL_DEINT_CUBIC(a, b, c, d, e)
#define DEINT_CUBIC(a, b, c, d, e)   REAL_DEINT_CUBIC(a,b,c,d,e)
#define REAL_DEINT_FF(a, b, c, d)
#define DEINT_FF(a, b, c, d)   REAL_DEINT_FF(a,b,c,d)
#define REAL_DEINT_L5(t1, t2, a, b, c)
#define DEINT_L5(t1, t2, a, b, c)   REAL_DEINT_L5(t1,t2,a,b,c)
#define REAL_MEDIAN(a, b, c)
#define MEDIAN(a, b, c)   REAL_MEDIAN(a,b,c)
#define FAST_L2_DIFF
#define REAL_L2_DIFF_CORE(a, b)
#define L2_DIFF_CORE(a, b)   REAL_L2_DIFF_CORE(a, b)
#define NEXT
#define PREV
#define REAL_SCALED_CPY(src1, src2, dst1, dst2)
#define SCALED_CPY(src1, src2, dst1, dst2)   REAL_SCALED_CPY(src1, src2, dst1, dst2)
#define REAL_SIMPLE_CPY(src1, src2, dst1, dst2)
#define SIMPLE_CPY(src1, src2, dst1, dst2)   REAL_SIMPLE_CPY(src1, src2, dst1, dst2)

Functions

static int vertClassify_TMPL (uint8_t src[], int stride, PPContext *c)
 Check if the middle 8x8 Block in the given 8x16 block is flat.
static void doVertLowPass_TMPL (uint8_t *src, int stride, PPContext *c)
 Do a vertical low pass filter on the 8x16 block (only write to the 8x8 block in the middle) using the 9-Tap Filter (1,1,2,2,4,2,2,1,1)/16.
static void vertX1Filter_TMPL (uint8_t *src, int stride, PPContext *co)
 Experimental Filter 1 will not damage linear gradients Flat blocks should look like they were passed through the (1,1,2,2,4,2,2,1,1) 9-Tap filter can only smooth blocks at the expected locations (it cannot smooth them if they did move) MMX2 version does correct clipping C version does not.
static void doVertDefFilter_TMPL (uint8_t src[], int stride, PPContext *c)
static void dering_TMPL (uint8_t src[], int stride, PPContext *c)
static void deInterlaceInterpolateLinear_TMPL (uint8_t src[], int stride)
 Deinterlace the given block by linearly interpolating every second line.
static void deInterlaceInterpolateCubic_TMPL (uint8_t src[], int stride)
 Deinterlace the given block by cubic interpolating every second line.
static void deInterlaceFF_TMPL (uint8_t src[], int stride, uint8_t *tmp)
 Deinterlace the given block by filtering every second line with a (-1 4 2 4 -1) filter.
static void deInterlaceL5_TMPL (uint8_t src[], int stride, uint8_t *tmp, uint8_t *tmp2)
 Deinterlace the given block by filtering every line with a (-1 2 6 2 -1) filter.
static void deInterlaceBlendLinear_TMPL (uint8_t src[], int stride, uint8_t *tmp)
 Deinterlace the given block by filtering all lines with a (1 2 1) filter.
static void deInterlaceMedian_TMPL (uint8_t src[], int stride)
 Deinterlace the given block by applying a median filter to every second line.
static void transpose1_TMPL (uint8_t *dst1, uint8_t *dst2, uint8_t *src, int srcStride)
 Transpose and shift the given 8x8 Block into dst1 and dst2.
static void transpose2_TMPL (uint8_t *dst, int dstStride, uint8_t *src)
 Transpose the given 8x8 block.
static void tempNoiseReducer_TMPL (uint8_t *src, int stride, uint8_t *tempBlurred, uint32_t *tempBlurredPast, int *maxNoise)
static av_always_inline void do_a_deblock_TMPL (uint8_t *src, int step, int stride, PPContext *c)
 accurate deblock filter
static void postProcess_TMPL (const uint8_t src[], int srcStride, uint8_t dst[], int dstStride, int width, int height, const QP_STORE_T QPs[], int QPStride, int isColor, PPContext *c2)
 Filter array of bytes (Y or U or V values).
static void blockCopy_TMPL (uint8_t dst[], int dstStride, const uint8_t src[], int srcStride, int levelFix, int64_t *packedOffsetAndScale)
 Copy a block from src to dst and fixes the blacklevel.
static void duplicate_TMPL (uint8_t src[], int stride)
 Duplicate the given 8 src pixels ? times upward.


Detailed Description

mmx/mmx2/3dnow postprocess code.

Definition in file postprocess_template.c.


Define Documentation

#define DEINT_CUBIC ( a,
b,
c,
d,
 )     REAL_DEINT_CUBIC(a,b,c,d,e)

#define DEINT_FF ( a,
b,
c,
 )     REAL_DEINT_FF(a,b,c,d)

Referenced by deInterlaceFF_TMPL().

#define DEINT_L5 ( t1,
t2,
a,
b,
c   )     REAL_DEINT_L5(t1,t2,a,b,c)

Referenced by deInterlaceL5_TMPL().

#define DERING_CORE ( dst,
src,
ppsx,
psx,
sx,
pplx,
plx,
lx,
t0,
t1   )     REAL_DERING_CORE(dst,src,ppsx,psx,sx,pplx,plx,lx,t0,t1)

Referenced by dering_TMPL().

#define FAST_L2_DIFF

#define FIND_MIN_MAX ( addr   )     REAL_FIND_MIN_MAX(addr)

Referenced by dering_TMPL().

#define L2_DIFF_CORE ( a,
 )     REAL_L2_DIFF_CORE(a, b)

Referenced by tempNoiseReducer_TMPL().

#define MEDIAN ( a,
b,
c   )     REAL_MEDIAN(a,b,c)

Referenced by deInterlaceMedian_TMPL().

#define NEXT

Value:

"movq (%0), %%mm2                       \n\t"\
            "movq (%0), %%mm3                       \n\t"\
            "add %1, %0                             \n\t"\
            "punpcklbw %%mm4, %%mm2                 \n\t"\
            "punpckhbw %%mm4, %%mm3                 \n\t"\
            "paddw %%mm2, %%mm0                     \n\t"\
            "paddw %%mm3, %%mm1                     \n\t"

Referenced by do_a_deblock_TMPL().

#define PAVGB ( a,
 )     REAL_PAVGB(a,b)

Definition at line 38 of file postprocess_template.c.

#define PMAXUB ( a,
 ) 

Value:

"psubusb " #a ", " #b " \n\t"\
    "paddb " #a ", " #b " \n\t"

Definition at line 52 of file postprocess_template.c.

#define PMINUB ( b,
a,
t   ) 

Value:

"movq " #a ", " #t " \n\t"\
    "psubusb " #b ", " #t " \n\t"\
    "psubb " #t ", " #a " \n\t"

Definition at line 43 of file postprocess_template.c.

Referenced by do_a_deblock_TMPL(), doVertDefFilter_TMPL(), and vertClassify_TMPL().

#define PREV

Value:

"movq (%0), %%mm2                       \n\t"\
            "movq (%0), %%mm3                       \n\t"\
            "add %1, %0                             \n\t"\
            "punpcklbw %%mm4, %%mm2                 \n\t"\
            "punpckhbw %%mm4, %%mm3                 \n\t"\
            "psubw %%mm2, %%mm0                     \n\t"\
            "psubw %%mm3, %%mm1                     \n\t"

Referenced by do_a_deblock_TMPL().

#define REAL_DEINT_CUBIC ( a,
b,
c,
d,
 ) 

Value:

"movq " #a ", %%mm0                     \n\t"\
        "movq " #b ", %%mm1                     \n\t"\
        "movq " #d ", %%mm2                     \n\t"\
        "movq " #e ", %%mm3                     \n\t"\
        PAVGB(%%mm2, %%mm1)                             /* (b+d) /2 */\
        PAVGB(%%mm3, %%mm0)                             /* a(a+e) /2 */\
        "movq %%mm0, %%mm2                      \n\t"\
        "punpcklbw %%mm7, %%mm0                 \n\t"\
        "punpckhbw %%mm7, %%mm2                 \n\t"\
        "movq %%mm1, %%mm3                      \n\t"\
        "punpcklbw %%mm7, %%mm1                 \n\t"\
        "punpckhbw %%mm7, %%mm3                 \n\t"\
        "psubw %%mm1, %%mm0                     \n\t"   /* L(a+e - (b+d))/2 */\
        "psubw %%mm3, %%mm2                     \n\t"   /* H(a+e - (b+d))/2 */\
        "psraw $3, %%mm0                        \n\t"   /* L(a+e - (b+d))/16 */\
        "psraw $3, %%mm2                        \n\t"   /* H(a+e - (b+d))/16 */\
        "psubw %%mm0, %%mm1                     \n\t"   /* L(9b + 9d - a - e)/16 */\
        "psubw %%mm2, %%mm3                     \n\t"   /* H(9b + 9d - a - e)/16 */\
        "packuswb %%mm3, %%mm1                  \n\t"\
        "movq %%mm1, " #c "                     \n\t"

#define REAL_DEINT_FF ( a,
b,
c,
 ) 

Value:

"movq " #a ", %%mm1                     \n\t"\
        "movq " #b ", %%mm2                     \n\t"\
        "movq " #c ", %%mm3                     \n\t"\
        "movq " #d ", %%mm4                     \n\t"\
        PAVGB(%%mm3, %%mm1)                          \
        PAVGB(%%mm4, %%mm0)                          \
        "movq %%mm0, %%mm3                      \n\t"\
        "punpcklbw %%mm7, %%mm0                 \n\t"\
        "punpckhbw %%mm7, %%mm3                 \n\t"\
        "movq %%mm1, %%mm4                      \n\t"\
        "punpcklbw %%mm7, %%mm1                 \n\t"\
        "punpckhbw %%mm7, %%mm4                 \n\t"\
        "psllw $2, %%mm1                        \n\t"\
        "psllw $2, %%mm4                        \n\t"\
        "psubw %%mm0, %%mm1                     \n\t"\
        "psubw %%mm3, %%mm4                     \n\t"\
        "movq %%mm2, %%mm5                      \n\t"\
        "movq %%mm2, %%mm0                      \n\t"\
        "punpcklbw %%mm7, %%mm2                 \n\t"\
        "punpckhbw %%mm7, %%mm5                 \n\t"\
        "paddw %%mm2, %%mm1                     \n\t"\
        "paddw %%mm5, %%mm4                     \n\t"\
        "psraw $2, %%mm1                        \n\t"\
        "psraw $2, %%mm4                        \n\t"\
        "packuswb %%mm4, %%mm1                  \n\t"\
        "movq %%mm1, " #b "                     \n\t"\

#define REAL_DEINT_L5 ( t1,
t2,
a,
b,
c   ) 

#define REAL_DERING_CORE ( dst,
src,
ppsx,
psx,
sx,
pplx,
plx,
lx,
t0,
t1   ) 

#define REAL_FIND_MIN_MAX ( addr   ) 

Value:

"movq " #addr ", %%mm0                  \n\t"\
        "movq %%mm7, %%mm1                      \n\t"\
        "psubusb %%mm0, %%mm6                   \n\t"\
        "paddb %%mm0, %%mm6                     \n\t"\
        "psubusb %%mm0, %%mm1                   \n\t"\
        "psubb %%mm1, %%mm7                     \n\t"

#define REAL_L2_DIFF_CORE ( a,
 ) 

Value:

"movq " #a ", %%mm5                     \n\t"\
        "movq " #b ", %%mm2                     \n\t"\
        "pxor %%mm7, %%mm2                      \n\t"\
        PAVGB(%%mm2, %%mm5)\
        "paddb %%mm6, %%mm5                     \n\t"\
        "movq %%mm5, %%mm2                      \n\t"\
        "psllw $8, %%mm5                        \n\t"\
        "pmaddwd %%mm5, %%mm5                   \n\t"\
        "pmaddwd %%mm2, %%mm2                   \n\t"\
        "paddd %%mm2, %%mm5                     \n\t"\
        "psrld $14, %%mm5                       \n\t"\
        "paddd %%mm5, %%mm0                     \n\t"

#define REAL_MEDIAN ( a,
b,
c   ) 

Value:

"movq " #a ", %%mm0                     \n\t"\
        "movq " #b ", %%mm2                     \n\t"\
        "movq " #c ", %%mm1                     \n\t"\
        "movq %%mm0, %%mm3                      \n\t"\
        "movq %%mm1, %%mm4                      \n\t"\
        "movq %%mm2, %%mm5                      \n\t"\
        "psubusb %%mm1, %%mm3                   \n\t"\
        "psubusb %%mm2, %%mm4                   \n\t"\
        "psubusb %%mm0, %%mm5                   \n\t"\
        "pcmpeqb %%mm7, %%mm3                   \n\t"\
        "pcmpeqb %%mm7, %%mm4                   \n\t"\
        "pcmpeqb %%mm7, %%mm5                   \n\t"\
        "movq %%mm3, %%mm6                      \n\t"\
        "pxor %%mm4, %%mm3                      \n\t"\
        "pxor %%mm5, %%mm4                      \n\t"\
        "pxor %%mm6, %%mm5                      \n\t"\
        "por %%mm3, %%mm1                       \n\t"\
        "por %%mm4, %%mm2                       \n\t"\
        "por %%mm5, %%mm0                       \n\t"\
        "pand %%mm2, %%mm0                      \n\t"\
        "pand %%mm1, %%mm0                      \n\t"\
        "movq %%mm0, " #b "                     \n\t"

#define REAL_PAVGB ( a,
 )     "pavgusb " #a ", " #b " \n\t"

Definition at line 36 of file postprocess_template.c.

#define REAL_SCALED_CPY ( src1,
src2,
dst1,
dst2   ) 

Value:

"movq " #src1 ", %%mm0          \n\t"\
        "movq " #src1 ", %%mm5          \n\t"\
        "punpcklbw %%mm4, %%mm0         \n\t"\
        "punpckhbw %%mm4, %%mm5         \n\t"\
        "psubw %%mm2, %%mm0             \n\t"\
        "psubw %%mm2, %%mm5             \n\t"\
        "movq " #src2 ", %%mm1          \n\t"\
        "psllw $6, %%mm0                \n\t"\
        "psllw $6, %%mm5                \n\t"\
        "pmulhw %%mm3, %%mm0            \n\t"\
        "movq " #src2 ", %%mm6          \n\t"\
        "pmulhw %%mm3, %%mm5            \n\t"\
        "punpcklbw %%mm4, %%mm1         \n\t"\
        "punpckhbw %%mm4, %%mm6         \n\t"\
        "psubw %%mm2, %%mm1             \n\t"\
        "psubw %%mm2, %%mm6             \n\t"\
        "psllw $6, %%mm1                \n\t"\
        "psllw $6, %%mm6                \n\t"\
        "pmulhw %%mm3, %%mm1            \n\t"\
        "pmulhw %%mm3, %%mm6            \n\t"\
        "packuswb %%mm5, %%mm0          \n\t"\
        "packuswb %%mm6, %%mm1          \n\t"\
        "movq %%mm0, " #dst1 "          \n\t"\
        "movq %%mm1, " #dst2 "          \n\t"\

#define REAL_SIMPLE_CPY ( src1,
src2,
dst1,
dst2   ) 

Value:

"movq " #src1 ", %%mm0          \n\t"\
        "movq " #src2 ", %%mm1          \n\t"\
        "movq %%mm0, " #dst1 "          \n\t"\
        "movq %%mm1, " #dst2 "          \n\t"\

#define SCALED_CPY ( src1,
src2,
dst1,
dst2   )     REAL_SCALED_CPY(src1, src2, dst1, dst2)

Referenced by blockCopy_TMPL().

#define SIMPLE_CPY ( src1,
src2,
dst1,
dst2   )     REAL_SIMPLE_CPY(src1, src2, dst1, dst2)

Referenced by blockCopy_TMPL().


Function Documentation

static void blockCopy_TMPL ( uint8_t  dst[],
int  dstStride,
const uint8_t  src[],
int  srcStride,
int  levelFix,
int64_t *  packedOffsetAndScale 
) [inline, static]

Copy a block from src to dst and fixes the blacklevel.

levelFix == 0 -> do not touch the brighness & contrast

Definition at line 3013 of file postprocess_template.c.

static void deInterlaceBlendLinear_TMPL ( uint8_t  src[],
int  stride,
uint8_t *  tmp 
) [inline, static]

Deinterlace the given block by filtering all lines with a (1 2 1) filter.

will be called for every 8x8 block and can read & write from line 4-15 lines 0-3 have been passed through the deblock / dering filters already, but can be read, too. lines 4-12 will be read into the deblocking filter and should be deinterlaced this filter will read lines 4-13 and write 4-11

Definition at line 1693 of file postprocess_template.c.

static void deInterlaceFF_TMPL ( uint8_t  src[],
int  stride,
uint8_t *  tmp 
) [inline, static]

Deinterlace the given block by filtering every second line with a (-1 4 2 4 -1) filter.

will be called for every 8x8 block and can read & write from line 4-15 lines 0-3 have been passed through the deblock / dering filters already, but can be read, too. lines 4-12 will be read into the deblocking filter and should be deinterlaced this filter will read lines 4-13 and write 5-11

Definition at line 1513 of file postprocess_template.c.

static void deInterlaceInterpolateCubic_TMPL ( uint8_t  src[],
int  stride 
) [inline, static]

Deinterlace the given block by cubic interpolating every second line.

will be called for every 8x8 block and can read & write from line 4-15 lines 0-3 have been passed through the deblock / dering filters already, but can be read, too. lines 4-12 will be read into the deblocking filter and should be deinterlaced this filter will read lines 3-15 and write 7-13

Definition at line 1449 of file postprocess_template.c.

static void deInterlaceInterpolateLinear_TMPL ( uint8_t  src[],
int  stride 
) [inline, static]

Deinterlace the given block by linearly interpolating every second line.

will be called for every 8x8 block and can read & write from line 4-15 lines 0-3 have been passed through the deblock / dering filters already, but can be read, too. lines 4-12 will be read into the deblocking filter and should be deinterlaced

Definition at line 1396 of file postprocess_template.c.

static void deInterlaceL5_TMPL ( uint8_t  src[],
int  stride,
uint8_t *  tmp,
uint8_t *  tmp2 
) [inline, static]

Deinterlace the given block by filtering every line with a (-1 2 6 2 -1) filter.

will be called for every 8x8 block and can read & write from line 4-15 lines 0-3 have been passed through the deblock / dering filters already, but can be read, too. lines 4-12 will be read into the deblocking filter and should be deinterlaced this filter will read lines 4-13 and write 4-11

Definition at line 1592 of file postprocess_template.c.

static void deInterlaceMedian_TMPL ( uint8_t  src[],
int  stride 
) [inline, static]

Deinterlace the given block by applying a median filter to every second line.

will be called for every 8x8 block and can read & write from line 4-15, lines 0-3 have been passed through the deblock / dering filters already, but can be read, too. lines 4-12 will be read into the deblocking filter and should be deinterlaced

Definition at line 1794 of file postprocess_template.c.

static void dering_TMPL ( uint8_t  src[],
int  stride,
PPContext c 
) [inline, static]

Definition at line 1041 of file postprocess_template.c.

static av_always_inline void do_a_deblock_TMPL ( uint8_t *  src,
int  step,
int  stride,
PPContext c 
) [static]

accurate deblock filter

Definition at line 2469 of file postprocess_template.c.

static void doVertDefFilter_TMPL ( uint8_t  src[],
int  stride,
PPContext c 
) [inline, static]

Definition at line 484 of file postprocess_template.c.

static void doVertLowPass_TMPL ( uint8_t *  src,
int  stride,
PPContext c 
) [inline, static]

Do a vertical low pass filter on the 8x16 block (only write to the 8x8 block in the middle) using the 9-Tap Filter (1,1,2,2,4,2,2,1,1)/16.

Definition at line 179 of file postprocess_template.c.

static void duplicate_TMPL ( uint8_t  src[],
int  stride 
) [inline, static]

Duplicate the given 8 src pixels ? times upward.

Definition at line 3141 of file postprocess_template.c.

static void postProcess_TMPL ( const uint8_t  src[],
int  srcStride,
uint8_t  dst[],
int  dstStride,
int  width,
int  height,
const QP_STORE_T  QPs[],
int  QPStride,
int  isColor,
PPContext c 
) [static]

Filter array of bytes (Y or U or V values).

Definition at line 3166 of file postprocess_template.c.

static void tempNoiseReducer_TMPL ( uint8_t *  src,
int  stride,
uint8_t *  tempBlurred,
uint32_t *  tempBlurredPast,
int *  maxNoise 
) [inline, static]

Definition at line 2080 of file postprocess_template.c.

static void transpose1_TMPL ( uint8_t *  dst1,
uint8_t *  dst2,
uint8_t *  src,
int  srcStride 
) [inline, static]

Transpose and shift the given 8x8 Block into dst1 and dst2.

Definition at line 1915 of file postprocess_template.c.

static void transpose2_TMPL ( uint8_t *  dst,
int  dstStride,
uint8_t *  src 
) [inline, static]

Transpose the given 8x8 block.

Definition at line 2000 of file postprocess_template.c.

static int vertClassify_TMPL ( uint8_t  src[],
int  stride,
PPContext c 
) [inline, static]

Check if the middle 8x8 Block in the given 8x16 block is flat.

Definition at line 62 of file postprocess_template.c.

static void vertX1Filter_TMPL ( uint8_t *  src,
int  stride,
PPContext co 
) [inline, static]

Experimental Filter 1 will not damage linear gradients Flat blocks should look like they were passed through the (1,1,2,2,4,2,2,1,1) 9-Tap filter can only smooth blocks at the expected locations (it cannot smooth them if they did move) MMX2 version does correct clipping C version does not.

Definition at line 358 of file postprocess_template.c.


Generated on Fri Oct 26 02:46:14 2012 for FFmpeg by  doxygen 1.5.8