Mercurial > libavcodec.hg
annotate dsputil.h @ 214:73df666cacc7 libavcodec
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
| author | nickols_k |
|---|---|
| date | Sun, 20 Jan 2002 14:48:02 +0000 |
| parents | 9e0e56869d05 |
| children | ddb1a0e94cf4 |
| rev | line source |
|---|---|
| 0 | 1 #ifndef DSPUTIL_H |
| 2 #define DSPUTIL_H | |
| 3 | |
| 4 #include "common.h" | |
| 5 | |
| 6 /* dct code */ | |
| 7 typedef short DCTELEM; | |
| 8 | |
| 9 void jpeg_fdct_ifast (DCTELEM *data); | |
| 10 | |
| 11 void j_rev_dct (DCTELEM *data); | |
| 12 | |
| 13 void fdct_mmx(DCTELEM *block); | |
| 14 | |
| 15 void (*av_fdct)(DCTELEM *block); | |
| 16 | |
| 34 | 17 /* encoding scans */ |
| 18 extern UINT8 ff_alternate_horizontal_scan[64]; | |
| 19 extern UINT8 ff_alternate_vertical_scan[64]; | |
| 20 extern UINT8 zigzag_direct[64]; | |
| 21 | |
|
190
9e0e56869d05
fix for non-mmx runtimedetect encoding bugs - patch by Michael Niedermayer <michaelni@gmx.at>
uid46427
parents:
174
diff
changeset
|
22 /* permutation table */ |
|
9e0e56869d05
fix for non-mmx runtimedetect encoding bugs - patch by Michael Niedermayer <michaelni@gmx.at>
uid46427
parents:
174
diff
changeset
|
23 extern UINT8 permutation[64]; |
|
9e0e56869d05
fix for non-mmx runtimedetect encoding bugs - patch by Michael Niedermayer <michaelni@gmx.at>
uid46427
parents:
174
diff
changeset
|
24 |
| 0 | 25 /* pixel operations */ |
| 26 #define MAX_NEG_CROP 384 | |
| 27 | |
| 28 /* temporary */ | |
| 29 extern UINT32 squareTbl[512]; | |
| 50 | 30 extern UINT8 cropTbl[256 + 2 * MAX_NEG_CROP]; |
| 0 | 31 |
| 32 void dsputil_init(void); | |
| 33 | |
| 34 /* pixel ops : interface with DCT */ | |
| 35 | |
|
19
82d4c9be9873
MMX/MMXEXT iDCT support, using external functions currently defined in libmpeg2
arpi_esp
parents:
6
diff
changeset
|
36 extern void (*ff_idct)(DCTELEM *block); |
| 0 | 37 extern void (*get_pixels)(DCTELEM *block, const UINT8 *pixels, int line_size); |
| 38 extern void (*put_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size); | |
| 39 extern void (*add_pixels_clamped)(const DCTELEM *block, UINT8 *pixels, int line_size); | |
| 40 | |
| 41 void get_pixels_c(DCTELEM *block, const UINT8 *pixels, int line_size); | |
| 42 void put_pixels_clamped_c(const DCTELEM *block, UINT8 *pixels, int line_size); | |
| 43 void add_pixels_clamped_c(const DCTELEM *block, UINT8 *pixels, int line_size); | |
| 44 | |
| 45 /* add and put pixel (decoding) */ | |
| 46 typedef void (*op_pixels_func)(UINT8 *block, const UINT8 *pixels, int line_size, int h); | |
| 47 | |
| 48 extern op_pixels_func put_pixels_tab[4]; | |
| 49 extern op_pixels_func avg_pixels_tab[4]; | |
| 50 extern op_pixels_func put_no_rnd_pixels_tab[4]; | |
| 51 extern op_pixels_func avg_no_rnd_pixels_tab[4]; | |
| 52 | |
| 53 /* sub pixel (encoding) */ | |
| 54 extern void (*sub_pixels_tab[4])(DCTELEM *block, const UINT8 *pixels, int line_size, int h); | |
| 55 | |
| 56 #define sub_pixels_2(block, pixels, line_size, dxy) \ | |
| 57 sub_pixels_tab[dxy](block, pixels, line_size, 8) | |
| 58 | |
| 59 /* motion estimation */ | |
| 60 | |
| 61 typedef int (*op_pixels_abs_func)(UINT8 *blk1, UINT8 *blk2, int line_size, int h); | |
| 62 | |
| 63 extern op_pixels_abs_func pix_abs16x16; | |
| 64 extern op_pixels_abs_func pix_abs16x16_x2; | |
| 65 extern op_pixels_abs_func pix_abs16x16_y2; | |
| 66 extern op_pixels_abs_func pix_abs16x16_xy2; | |
| 67 | |
| 68 int pix_abs16x16_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | |
| 69 int pix_abs16x16_x2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | |
| 70 int pix_abs16x16_y2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | |
| 71 int pix_abs16x16_xy2_c(UINT8 *blk1, UINT8 *blk2, int lx, int h); | |
| 72 | |
|
174
ac5075a55488
new IDCT code by Michael Niedermayer (michaelni@gmx.at) - #define SIMPLE_IDCT to enable
arpi_esp
parents:
88
diff
changeset
|
73 static inline int block_permute_op(int j) |
|
ac5075a55488
new IDCT code by Michael Niedermayer (michaelni@gmx.at) - #define SIMPLE_IDCT to enable
arpi_esp
parents:
88
diff
changeset
|
74 { |
|
190
9e0e56869d05
fix for non-mmx runtimedetect encoding bugs - patch by Michael Niedermayer <michaelni@gmx.at>
uid46427
parents:
174
diff
changeset
|
75 return permutation[j]; |
|
174
ac5075a55488
new IDCT code by Michael Niedermayer (michaelni@gmx.at) - #define SIMPLE_IDCT to enable
arpi_esp
parents:
88
diff
changeset
|
76 } |
| 34 | 77 |
| 78 void block_permute(INT16 *block); | |
| 79 | |
| 62 | 80 #if defined(HAVE_MMX) |
| 0 | 81 |
| 82 #define MM_MMX 0x0001 /* standard MMX */ | |
| 83 #define MM_3DNOW 0x0004 /* AMD 3DNOW */ | |
| 84 #define MM_MMXEXT 0x0002 /* SSE integer functions or AMD MMX ext */ | |
| 85 #define MM_SSE 0x0008 /* SSE functions */ | |
| 86 #define MM_SSE2 0x0010 /* PIV SSE2 functions */ | |
| 87 | |
| 88 extern int mm_flags; | |
| 89 | |
| 90 int mm_support(void); | |
| 91 | |
| 92 static inline void emms(void) | |
| 93 { | |
|
6
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
94 __asm __volatile ("emms;":::"memory"); |
|
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
95 } |
|
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
96 |
|
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
97 #define emms_c() \ |
|
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
98 {\ |
|
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
99 if (mm_flags & MM_MMX)\ |
|
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
100 emms();\ |
| 0 | 101 } |
| 102 | |
| 103 #define __align8 __attribute__ ((aligned (8))) | |
| 104 | |
| 105 void dsputil_init_mmx(void); | |
| 106 | |
| 62 | 107 #elif defined(ARCH_ARMV4L) |
| 108 | |
| 109 #define emms_c() | |
| 110 | |
| 111 /* This is to use 4 bytes read to the IDCT pointers for some 'zero' | |
| 112 line optimizations */ | |
| 113 #define __align8 __attribute__ ((aligned (4))) | |
| 114 | |
| 115 void dsputil_init_armv4l(void); | |
| 116 | |
| 88 | 117 #elif defined(HAVE_MLIB) |
| 118 | |
| 119 #define emms_c() | |
| 120 | |
| 121 /* SPARC/VIS IDCT needs 8-byte aligned DCT blocks */ | |
| 122 #define __align8 __attribute__ ((aligned (8))) | |
| 123 | |
| 124 void dsputil_init_mlib(void); | |
| 125 | |
|
214
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
190
diff
changeset
|
126 #elif defined(ARCH_ALPHA) |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
190
diff
changeset
|
127 |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
190
diff
changeset
|
128 #define emms_c() |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
190
diff
changeset
|
129 #define __align8 __attribute__ ((aligned (8))) |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
190
diff
changeset
|
130 |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
190
diff
changeset
|
131 void dsputil_init_alpha(void); |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
190
diff
changeset
|
132 |
| 0 | 133 #else |
| 134 | |
|
6
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
135 #define emms_c() |
|
ec4642daa6fe
added emms_c() macro which should can used in c code in both mmx/non mmx cases
glantau
parents:
2
diff
changeset
|
136 |
| 0 | 137 #define __align8 |
| 138 | |
| 139 #endif | |
| 140 | |
| 141 #endif |
