33 int dstStride,
int src1Stride,
int h);
36 int src1Stride,
int h);
38 int dstStride,
int src1Stride,
int h);
40 int dstStride,
int src1Stride,
int h);
42 int dstStride,
int src1Stride,
int h);
44 int dstStride,
int src1Stride,
int h);
46 int dstStride,
int srcStride,
int h);
48 int dstStride,
int srcStride,
int h);
50 int dstStride,
int srcStride,
53 int dstStride,
int srcStride,
int h);
55 int dstStride,
int srcStride,
int h);
57 int dstStride,
int srcStride,
60 int dstStride,
int srcStride);
62 int dstStride,
int srcStride);
64 int dstStride,
int srcStride);
66 int dstStride,
int srcStride);
68 int dstStride,
int srcStride);
70 int dstStride,
int srcStride);
/* Alias the no_rnd full-pel put names to the regular put functions.
 * QPEL_OP(put_no_rnd_, ...) pastes together ff_put_no_rnd_pixels8_mmxext and
 * ff_put_no_rnd_pixels16_mmxext for its mc00 cases; these defines are what
 * those names resolve to. */
71 #define ff_put_no_rnd_pixels16_mmxext ff_put_pixels16_mmxext
72 #define ff_put_no_rnd_pixels8_mmxext ff_put_pixels8_mmxext
92 const int16_t *window,
unsigned int len);
94 const int16_t *window,
unsigned int len);
96 const int16_t *window,
unsigned int len);
98 const int16_t *window,
unsigned int len);
100 const int16_t *window,
unsigned int len);
102 const int16_t *window,
unsigned int len);
109 int *left,
int *left_top);
/* Instantiate PIXELS16 for the ff_avg and ff_put operations with the _mmxext
 * suffix; both instantiations are static.
 * NOTE(review): PIXELS16 is defined elsewhere; presumably it emits the
 * 16-pixel-wide functions (e.g. ff_avg_pixels16_mmxext) used by QPEL_OP --
 * confirm against the macro definition. */
126 PIXELS16(
static, ff_avg, , , _mmxext)
127 PIXELS16(static, ff_put, , , _mmxext)
/**
 * Generate the static quarter-pel functions OPNAME qpel8_mcXY_ MMX and
 * OPNAME qpel16_mcXY_ MMX for X, Y in 0..3.
 *
 * OPNAME is pasted into the name of the helper that produces the final
 * result (ff_ OPNAME ...), RND is pasted into the names of the intermediate
 * ff_put RND ... helpers, and MMX is the function-name suffix.
 *
 * As far as the visible lines show:
 *  - mc00 forwards to ff_ OPNAME pixels{8,16}_ MMX.
 *  - mc20 / mc02 run the OPNAME h / v lowpass straight into dst.
 *  - mc10 / mc30 (mc01 / mc03) put the h (v) lowpass into a temporary and
 *    pass it, together with src or src + 1 (src + stride), to the OPNAME
 *    pixels_l2 helper.
 *  - mc11 / mc31 / mc13 / mc33 build halfH (h lowpass, then pixels_l2 with
 *    src or src + 1), derive halfHV from halfH with the v lowpass, and hand
 *    halfH (halfH + 8 resp. halfH + 16 when Y is 3) and halfHV to the OPNAME
 *    pixels_l2 helper.
 *  - mc21 / mc23 do the same without the src step on halfH.
 *  - mc12 / mc32 build halfH with the src step and finish with the OPNAME
 *    v lowpass into dst; mc22 does so without the src step.
 *
 * The two-stage cases carve halfHV and halfH out of one local uint64_t array,
 * with halfH starting 64 bytes (8x8) or 256 bytes (16x16) into it.
 *
 * NOTE(review): pixels_l2 presumably averages its two sources -- the helper
 * is declared elsewhere; confirm before relying on this.
 */
129 #define QPEL_OP(OPNAME, RND, MMX) \
130 static void OPNAME ## qpel8_mc00_ ## MMX (uint8_t *dst, uint8_t *src, \
133 ff_ ## OPNAME ## pixels8_ ## MMX(dst, src, stride, 8); \
136 static void OPNAME ## qpel8_mc10_ ## MMX(uint8_t *dst, uint8_t *src, \
140 uint8_t * const half = (uint8_t*)temp; \
141 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(half, src, 8, \
143 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, src, half, \
144 stride, stride, 8); \
147 static void OPNAME ## qpel8_mc20_ ## MMX(uint8_t *dst, uint8_t *src, \
150 ff_ ## OPNAME ## mpeg4_qpel8_h_lowpass_ ## MMX(dst, src, stride, \
154 static void OPNAME ## qpel8_mc30_ ## MMX(uint8_t *dst, uint8_t *src, \
158 uint8_t * const half = (uint8_t*)temp; \
159 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(half, src, 8, \
161 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, src + 1, half, stride, \
165 static void OPNAME ## qpel8_mc01_ ## MMX(uint8_t *dst, uint8_t *src, \
169 uint8_t * const half = (uint8_t*)temp; \
170 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(half, src, \
172 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, src, half, \
173 stride, stride, 8); \
176 static void OPNAME ## qpel8_mc02_ ## MMX(uint8_t *dst, uint8_t *src, \
179 ff_ ## OPNAME ## mpeg4_qpel8_v_lowpass_ ## MMX(dst, src, \
183 static void OPNAME ## qpel8_mc03_ ## MMX(uint8_t *dst, uint8_t *src, \
187 uint8_t * const half = (uint8_t*)temp; \
188 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(half, src, \
190 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, src + stride, half, stride,\
194 static void OPNAME ## qpel8_mc11_ ## MMX(uint8_t *dst, uint8_t *src, \
197 uint64_t half[8 + 9]; \
198 uint8_t * const halfH = ((uint8_t*)half) + 64; \
199 uint8_t * const halfHV = ((uint8_t*)half); \
200 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
202 ff_put ## RND ## pixels8_l2_ ## MMX(halfH, src, halfH, 8, \
204 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(halfHV, halfH, 8, 8);\
205 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, halfH, halfHV, \
209 static void OPNAME ## qpel8_mc31_ ## MMX(uint8_t *dst, uint8_t *src, \
212 uint64_t half[8 + 9]; \
213 uint8_t * const halfH = ((uint8_t*)half) + 64; \
214 uint8_t * const halfHV = ((uint8_t*)half); \
215 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
217 ff_put ## RND ## pixels8_l2_ ## MMX(halfH, src + 1, halfH, 8, \
219 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(halfHV, halfH, 8, 8);\
220 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, halfH, halfHV, \
224 static void OPNAME ## qpel8_mc13_ ## MMX(uint8_t *dst, uint8_t *src, \
227 uint64_t half[8 + 9]; \
228 uint8_t * const halfH = ((uint8_t*)half) + 64; \
229 uint8_t * const halfHV = ((uint8_t*)half); \
230 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
232 ff_put ## RND ## pixels8_l2_ ## MMX(halfH, src, halfH, 8, \
234 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(halfHV, halfH, 8, 8);\
235 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, halfH + 8, halfHV, \
239 static void OPNAME ## qpel8_mc33_ ## MMX(uint8_t *dst, uint8_t *src, \
242 uint64_t half[8 + 9]; \
243 uint8_t * const halfH = ((uint8_t*)half) + 64; \
244 uint8_t * const halfHV = ((uint8_t*)half); \
245 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
247 ff_put ## RND ## pixels8_l2_ ## MMX(halfH, src + 1, halfH, 8, \
249 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(halfHV, halfH, 8, 8);\
250 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, halfH + 8, halfHV, \
254 static void OPNAME ## qpel8_mc21_ ## MMX(uint8_t *dst, uint8_t *src, \
257 uint64_t half[8 + 9]; \
258 uint8_t * const halfH = ((uint8_t*)half) + 64; \
259 uint8_t * const halfHV = ((uint8_t*)half); \
260 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
262 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(halfHV, halfH, 8, 8);\
263 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, halfH, halfHV, \
267 static void OPNAME ## qpel8_mc23_ ## MMX(uint8_t *dst, uint8_t *src, \
270 uint64_t half[8 + 9]; \
271 uint8_t * const halfH = ((uint8_t*)half) + 64; \
272 uint8_t * const halfHV = ((uint8_t*)half); \
273 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
275 ff_put ## RND ## mpeg4_qpel8_v_lowpass_ ## MMX(halfHV, halfH, 8, 8);\
276 ff_ ## OPNAME ## pixels8_l2_ ## MMX(dst, halfH + 8, halfHV, \
280 static void OPNAME ## qpel8_mc12_ ## MMX(uint8_t *dst, uint8_t *src, \
283 uint64_t half[8 + 9]; \
284 uint8_t * const halfH = ((uint8_t*)half); \
285 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
287 ff_put ## RND ## pixels8_l2_ ## MMX(halfH, src, halfH, \
289 ff_ ## OPNAME ## mpeg4_qpel8_v_lowpass_ ## MMX(dst, halfH, \
293 static void OPNAME ## qpel8_mc32_ ## MMX(uint8_t *dst, uint8_t *src, \
296 uint64_t half[8 + 9]; \
297 uint8_t * const halfH = ((uint8_t*)half); \
298 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
300 ff_put ## RND ## pixels8_l2_ ## MMX(halfH, src + 1, halfH, 8, \
302 ff_ ## OPNAME ## mpeg4_qpel8_v_lowpass_ ## MMX(dst, halfH, \
306 static void OPNAME ## qpel8_mc22_ ## MMX(uint8_t *dst, uint8_t *src, \
310 uint8_t * const halfH = ((uint8_t*)half); \
311 ff_put ## RND ## mpeg4_qpel8_h_lowpass_ ## MMX(halfH, src, 8, \
313 ff_ ## OPNAME ## mpeg4_qpel8_v_lowpass_ ## MMX(dst, halfH, \
317 static void OPNAME ## qpel16_mc00_ ## MMX (uint8_t *dst, uint8_t *src, \
320 ff_ ## OPNAME ## pixels16_ ## MMX(dst, src, stride, 16); \
323 static void OPNAME ## qpel16_mc10_ ## MMX(uint8_t *dst, uint8_t *src, \
327 uint8_t * const half = (uint8_t*)temp; \
328 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(half, src, 16, \
330 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, src, half, stride, \
334 static void OPNAME ## qpel16_mc20_ ## MMX(uint8_t *dst, uint8_t *src, \
337 ff_ ## OPNAME ## mpeg4_qpel16_h_lowpass_ ## MMX(dst, src, \
338 stride, stride, 16);\
341 static void OPNAME ## qpel16_mc30_ ## MMX(uint8_t *dst, uint8_t *src, \
345 uint8_t * const half = (uint8_t*)temp; \
346 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(half, src, 16, \
348 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, src + 1, half, \
349 stride, stride, 16); \
352 static void OPNAME ## qpel16_mc01_ ## MMX(uint8_t *dst, uint8_t *src, \
356 uint8_t * const half = (uint8_t*)temp; \
357 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(half, src, 16, \
359 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, src, half, stride, \
363 static void OPNAME ## qpel16_mc02_ ## MMX(uint8_t *dst, uint8_t *src, \
366 ff_ ## OPNAME ## mpeg4_qpel16_v_lowpass_ ## MMX(dst, src, \
370 static void OPNAME ## qpel16_mc03_ ## MMX(uint8_t *dst, uint8_t *src, \
374 uint8_t * const half = (uint8_t*)temp; \
375 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(half, src, 16, \
377 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, src+stride, half, \
378 stride, stride, 16); \
381 static void OPNAME ## qpel16_mc11_ ## MMX(uint8_t *dst, uint8_t *src, \
384 uint64_t half[16 * 2 + 17 * 2]; \
385 uint8_t * const halfH = ((uint8_t*)half) + 256; \
386 uint8_t * const halfHV = ((uint8_t*)half); \
387 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
389 ff_put ## RND ## pixels16_l2_ ## MMX(halfH, src, halfH, 16, \
391 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(halfHV, halfH, \
393 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, halfH, halfHV, \
397 static void OPNAME ## qpel16_mc31_ ## MMX(uint8_t *dst, uint8_t *src, \
400 uint64_t half[16 * 2 + 17 * 2]; \
401 uint8_t * const halfH = ((uint8_t*)half) + 256; \
402 uint8_t * const halfHV = ((uint8_t*)half); \
403 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
405 ff_put ## RND ## pixels16_l2_ ## MMX(halfH, src + 1, halfH, 16, \
407 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(halfHV, halfH, \
409 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, halfH, halfHV, \
413 static void OPNAME ## qpel16_mc13_ ## MMX(uint8_t *dst, uint8_t *src, \
416 uint64_t half[16 * 2 + 17 * 2]; \
417 uint8_t * const halfH = ((uint8_t*)half) + 256; \
418 uint8_t * const halfHV = ((uint8_t*)half); \
419 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
421 ff_put ## RND ## pixels16_l2_ ## MMX(halfH, src, halfH, 16, \
423 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(halfHV, halfH, \
425 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, halfH + 16, halfHV, \
429 static void OPNAME ## qpel16_mc33_ ## MMX(uint8_t *dst, uint8_t *src, \
432 uint64_t half[16 * 2 + 17 * 2]; \
433 uint8_t * const halfH = ((uint8_t*)half) + 256; \
434 uint8_t * const halfHV = ((uint8_t*)half); \
435 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
437 ff_put ## RND ## pixels16_l2_ ## MMX(halfH, src + 1, halfH, 16, \
439 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(halfHV, halfH, \
441 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, halfH + 16, halfHV, \
445 static void OPNAME ## qpel16_mc21_ ## MMX(uint8_t *dst, uint8_t *src, \
448 uint64_t half[16 * 2 + 17 * 2]; \
449 uint8_t * const halfH = ((uint8_t*)half) + 256; \
450 uint8_t * const halfHV = ((uint8_t*)half); \
451 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
453 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(halfHV, halfH, \
455 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, halfH, halfHV, \
459 static void OPNAME ## qpel16_mc23_ ## MMX(uint8_t *dst, uint8_t *src, \
462 uint64_t half[16 * 2 + 17 * 2]; \
463 uint8_t * const halfH = ((uint8_t*)half) + 256; \
464 uint8_t * const halfHV = ((uint8_t*)half); \
465 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
467 ff_put ## RND ## mpeg4_qpel16_v_lowpass_ ## MMX(halfHV, halfH, \
469 ff_ ## OPNAME ## pixels16_l2_ ## MMX(dst, halfH + 16, halfHV, \
473 static void OPNAME ## qpel16_mc12_ ## MMX(uint8_t *dst, uint8_t *src, \
476 uint64_t half[17 * 2]; \
477 uint8_t * const halfH = ((uint8_t*)half); \
478 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
480 ff_put ## RND ## pixels16_l2_ ## MMX(halfH, src, halfH, 16, \
482 ff_ ## OPNAME ## mpeg4_qpel16_v_lowpass_ ## MMX(dst, halfH, \
486 static void OPNAME ## qpel16_mc32_ ## MMX(uint8_t *dst, uint8_t *src, \
489 uint64_t half[17 * 2]; \
490 uint8_t * const halfH = ((uint8_t*)half); \
491 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
493 ff_put ## RND ## pixels16_l2_ ## MMX(halfH, src + 1, halfH, 16, \
495 ff_ ## OPNAME ## mpeg4_qpel16_v_lowpass_ ## MMX(dst, halfH, \
499 static void OPNAME ## qpel16_mc22_ ## MMX(uint8_t *dst, uint8_t *src, \
502 uint64_t half[17 * 2]; \
503 uint8_t * const halfH = ((uint8_t*)half); \
504 ff_put ## RND ## mpeg4_qpel16_h_lowpass_ ## MMX(halfH, src, 16, \
506 ff_ ## OPNAME ## mpeg4_qpel16_v_lowpass_ ## MMX(dst, halfH, \
/* Instantiate the qpel8 / qpel16 function families with the mmxext suffix:
 *   put_        -- intermediates named ff_put_mpeg4_... / ff_put_pixels..._l2_...
 *   avg_        -- same intermediates as put_ (RND is "_" for both)
 *   put_no_rnd_ -- intermediates named ff_put_no_rnd_... (RND is "_no_rnd_") */
510 QPEL_OP(put_, _, mmxext)
511 QPEL_OP(avg_, _, mmxext)
512 QPEL_OP(put_no_rnd_, _no_rnd_, mmxext)
/**
 * Fill the 16 entries of c->PFX_pixels_tab[IDX] with the functions named
 * PREFIX PFX SIZE _mcXY_ CPU (all five pieces are token-pasted).
 *
 * Entry number x + 4 * y receives the mcXY variant, i.e. the table is laid
 * out row by row with X as the fast index: [0] = mc00, [1] = mc10, ...,
 * [4] = mc01, ..., [15] = mc33.
 *
 * The macro expects a variable named c to be in scope at the expansion site.
 */
515 #define SET_QPEL_FUNCS(PFX, IDX, SIZE, CPU, PREFIX) \
517 c->PFX ## _pixels_tab[IDX][ 0] = PREFIX ## PFX ## SIZE ## _mc00_ ## CPU; \
518 c->PFX ## _pixels_tab[IDX][ 1] = PREFIX ## PFX ## SIZE ## _mc10_ ## CPU; \
519 c->PFX ## _pixels_tab[IDX][ 2] = PREFIX ## PFX ## SIZE ## _mc20_ ## CPU; \
520 c->PFX ## _pixels_tab[IDX][ 3] = PREFIX ## PFX ## SIZE ## _mc30_ ## CPU; \
521 c->PFX ## _pixels_tab[IDX][ 4] = PREFIX ## PFX ## SIZE ## _mc01_ ## CPU; \
522 c->PFX ## _pixels_tab[IDX][ 5] = PREFIX ## PFX ## SIZE ## _mc11_ ## CPU; \
523 c->PFX ## _pixels_tab[IDX][ 6] = PREFIX ## PFX ## SIZE ## _mc21_ ## CPU; \
524 c->PFX ## _pixels_tab[IDX][ 7] = PREFIX ## PFX ## SIZE ## _mc31_ ## CPU; \
525 c->PFX ## _pixels_tab[IDX][ 8] = PREFIX ## PFX ## SIZE ## _mc02_ ## CPU; \
526 c->PFX ## _pixels_tab[IDX][ 9] = PREFIX ## PFX ## SIZE ## _mc12_ ## CPU; \
527 c->PFX ## _pixels_tab[IDX][10] = PREFIX ## PFX ## SIZE ## _mc22_ ## CPU; \
528 c->PFX ## _pixels_tab[IDX][11] = PREFIX ## PFX ## SIZE ## _mc32_ ## CPU; \
529 c->PFX ## _pixels_tab[IDX][12] = PREFIX ## PFX ## SIZE ## _mc03_ ## CPU; \
530 c->PFX ## _pixels_tab[IDX][13] = PREFIX ## PFX ## SIZE ## _mc13_ ## CPU; \
531 c->PFX ## _pixels_tab[IDX][14] = PREFIX ## PFX ## SIZE ## _mc23_ ## CPU; \
532 c->PFX ## _pixels_tab[IDX][15] = PREFIX ## PFX ## SIZE ## _mc33_ ## CPU; \
545 if (!high_bit_depth) {
551 #if CONFIG_VIDEODSP && (ARCH_X86_32 || !HAVE_YASM)
558 #if HAVE_MMX_EXTERNAL
559 if (CONFIG_H263_DECODER || CONFIG_H263_ENCODER) {
571 #if HAVE_MMXEXT_INLINE
581 #if HAVE_MMXEXT_EXTERNAL
611 if (!high_bit_depth) {
623 #if HAVE_INLINE_ASM && CONFIG_VIDEODSP
643 #if HAVE_SSE2_EXTERNAL
663 #if HAVE_SSSE3_EXTERNAL
681 #if HAVE_SSE4_EXTERNAL
690 #if HAVE_7REGS && HAVE_INLINE_ASM