25 #include "libavutil/cpu.h"
32 ptrdiff_t line_size,
int h);
34 ptrdiff_t line_size,
int h);
36 ptrdiff_t line_size,
int h);
38 ptrdiff_t line_size,
int h);
40 ptrdiff_t line_size,
int h);
42 ptrdiff_t line_size,
int h);
45 ptrdiff_t line_size,
int h);
48 ptrdiff_t line_size,
int h);
50 ptrdiff_t line_size,
int h);
52 ptrdiff_t line_size,
int h);
54 ptrdiff_t line_size,
int h);
56 ptrdiff_t line_size,
int h);
59 ptrdiff_t line_size,
int h);
62 ptrdiff_t line_size,
int h);
64 ptrdiff_t line_size,
int h);
66 ptrdiff_t line_size,
int h);
68 ptrdiff_t line_size,
int h);
70 ptrdiff_t line_size,
int h);
72 ptrdiff_t line_size,
int h);
74 ptrdiff_t line_size,
int h);
76 ptrdiff_t line_size,
int h);
78 #define avg_pixels8_mmx ff_avg_pixels8_mmx
79 #define avg_pixels8_x2_mmx ff_avg_pixels8_x2_mmx
80 #define avg_pixels16_mmx ff_avg_pixels16_mmx
81 #define avg_pixels8_xy2_mmx ff_avg_pixels8_xy2_mmx
82 #define avg_pixels16_xy2_mmx ff_avg_pixels16_xy2_mmx
83 #define put_pixels8_mmx ff_put_pixels8_mmx
84 #define put_pixels16_mmx ff_put_pixels16_mmx
85 #define put_pixels8_xy2_mmx ff_put_pixels8_xy2_mmx
86 #define put_pixels16_xy2_mmx ff_put_pixels16_xy2_mmx
87 #define avg_no_rnd_pixels16_mmx ff_avg_pixels16_mmx
88 #define put_no_rnd_pixels8_mmx ff_put_pixels8_mmx
89 #define put_no_rnd_pixels16_mmx ff_put_pixels16_mmx
95 #define DEF(x, y) x ## _no_rnd_ ## y ## _mmx
96 #define SET_RND MOVQ_WONE
97 #define PAVGBP(a, b, c, d, e, f) PAVGBP_MMX_NO_RND(a, b, c, d, e, f)
98 #define PAVGB(a, b, c, e) PAVGB_MMX_NO_RND(a, b, c, e)
110 PIXELS16(
static, avg_no_rnd, , _y2, _mmx)
111 PIXELS16(static, put_no_rnd, , _y2, _mmx)
113 PIXELS16(static, avg_no_rnd, , _xy2, _mmx)
114 PIXELS16(static, put_no_rnd, , _xy2, _mmx)
119 #define DEF(x, y) x ## _ ## y ## _mmx
120 #define SET_RND MOVQ_WTWO
121 #define PAVGBP(a, b, c, d, e, f) PAVGBP_MMX(a, b, c, d, e, f)
122 #define PAVGB(a, b, c, e) PAVGB_MMX(a, b, c, e)
139 #define HPELDSP_AVG_PIXELS16(CPUEXT) \
140 PIXELS16(static, put_no_rnd, ff_, _x2, CPUEXT) \
141 PIXELS16(static, put, ff_, _y2, CPUEXT) \
142 PIXELS16(static, put_no_rnd, ff_, _y2, CPUEXT) \
143 PIXELS16(static, avg, ff_, , CPUEXT) \
144 PIXELS16(static, avg, ff_, _x2, CPUEXT) \
145 PIXELS16(static, avg, ff_, _y2, CPUEXT) \
146 PIXELS16(static, avg, ff_, _xy2, CPUEXT)
148 HPELDSP_AVG_PIXELS16(_3dnow)
149 HPELDSP_AVG_PIXELS16(_mmxext)
153 #define SET_HPEL_FUNCS(PFX, IDX, SIZE, CPU) \
155 c->PFX ## _pixels_tab IDX [0] = PFX ## _pixels ## SIZE ## _ ## CPU; \
156 c->PFX ## _pixels_tab IDX [1] = PFX ## _pixels ## SIZE ## _x2_ ## CPU; \
157 c->PFX ## _pixels_tab IDX [2] = PFX ## _pixels ## SIZE ## _y2_ ## CPU; \
158 c->PFX ## _pixels_tab IDX [3] = PFX ## _pixels ## SIZE ## _xy2_ ## CPU; \
176 #if HAVE_MMXEXT_EXTERNAL
210 #if HAVE_AMD3DNOW_EXTERNAL
244 #if HAVE_SSE2_EXTERNAL
void ff_put_pixels8_x2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_no_rnd_pixels8_y2_exact_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
op_pixels_func avg_pixels_tab[4][4]
Halfpel motion compensation with rounding (a+b+1)>>1.
static void hpeldsp_init_3dnow(HpelDSPContext *c, int flags, int cpu_flags)
static void hpeldsp_init_mmx(HpelDSPContext *c, int flags, int cpu_flags)
static void hpeldsp_init_mmxext(HpelDSPContext *c, int flags, int cpu_flags)
void ff_avg_pixels8_x2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_pixels8_x2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_no_rnd_pixels8_y2_exact_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_avg_pixels8_y2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_avg_pixels8_xy2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_pixels8_y2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
#define CODEC_FLAG_BITEXACT
Use only bitexact stuff (except (I)DCT).
int av_get_cpu_flags(void)
Return the flags which specify extensions supported by the CPU.
void ff_hpeldsp_init_x86(HpelDSPContext *c, int flags)
void ff_put_pixels16_x2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_no_rnd_pixels8_y2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_pixels16_sse2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
static void hpeldsp_init_sse2(HpelDSPContext *c, int flags, int cpu_flags)
#define SET_HPEL_FUNCS(PFX, IDX, SIZE, CPU)
void ff_avg_pixels8_x2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_no_rnd_pixels8_y2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
#define EXTERNAL_AMD3DNOW(flags)
#define INLINE_MMX(flags)
void ff_put_pixels16_x2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_avg_pixels8_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
op_pixels_func put_pixels_tab[4][4]
Halfpel motion compensation with rounding (a+b+1)>>1.
void ff_put_no_rnd_pixels8_x2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
op_pixels_func put_no_rnd_pixels_tab[4][4]
Halfpel motion compensation with no rounding (a+b)>>1.
void ff_avg_pixels8_xy2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
#define EXTERNAL_SSE2(flags)
void ff_put_no_rnd_pixels8_x2_exact_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_avg_pixels16_sse2(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
#define EXTERNAL_MMXEXT(flags)
void ff_avg_pixels8_y2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
#define CONFIG_VP3_DECODER
void ff_put_pixels8_y2_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
#define AV_CPU_FLAG_SSE2SLOW
SSE2 supported, but usually not faster.
void ff_avg_pixels8_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_no_rnd_pixels8_x2_mmxext(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
void ff_put_no_rnd_pixels8_x2_exact_3dnow(uint8_t *block, const uint8_t *pixels, ptrdiff_t line_size, int h)
#define PIXELS16(STATIC, PFX1, PFX2, TYPE, CPUEXT)