annotate src/ffmpeg/libavcodec/ppc/dsputil_ppc.h @ 808:e8776388b02a trunk

[svn] - add ffmpeg
author nenolod
date Mon, 12 Mar 2007 11:18:54 -0700
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
808
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
1 /*
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
2 * Copyright (c) 2003-2004 Romain Dolbeau <romain@dolbeau.org>
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
3 *
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
4 * This file is part of FFmpeg.
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
5 *
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
6 * FFmpeg is free software; you can redistribute it and/or
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
7 * modify it under the terms of the GNU Lesser General Public
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
8 * License as published by the Free Software Foundation; either
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
9 * version 2.1 of the License, or (at your option) any later version.
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
10 *
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
11 * FFmpeg is distributed in the hope that it will be useful,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
14 * Lesser General Public License for more details.
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
15 *
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
16 * You should have received a copy of the GNU Lesser General Public
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
17 * License along with FFmpeg; if not, write to the Free Software
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
19 */
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
20
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
21 #ifndef _DSPUTIL_PPC_
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
22 #define _DSPUTIL_PPC_
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
23
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
24 #ifdef POWERPC_PERFORMANCE_REPORT
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
25 void powerpc_display_perf_report(void);
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
26 /* the 604* have 2, the G3* have 4, the G4s have 6,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
27 and the G5 are completely different (they MUST use
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
28 POWERPC_MODE_64BITS, and let's hope all future 64-bit PPC
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
29 will use the same PMCs...) */
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
30 #define POWERPC_NUM_PMC_ENABLED 6
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
31 /* if you add to the enum below, also add to the perfname array
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
32 in dsputil_ppc.c */
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
33 enum powerpc_perf_index {
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
34 altivec_fft_num = 0,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
35 altivec_gmc1_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
36 altivec_dct_unquantize_h263_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
37 altivec_fdct,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
38 altivec_idct_add_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
39 altivec_idct_put_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
40 altivec_put_pixels16_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
41 altivec_avg_pixels16_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
42 altivec_avg_pixels8_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
43 altivec_put_pixels8_xy2_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
44 altivec_put_no_rnd_pixels8_xy2_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
45 altivec_put_pixels16_xy2_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
46 altivec_put_no_rnd_pixels16_xy2_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
47 altivec_hadamard8_diff8x8_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
48 altivec_hadamard8_diff16_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
49 altivec_avg_pixels8_xy2_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
50 powerpc_clear_blocks_dcbz32,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
51 powerpc_clear_blocks_dcbz128,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
52 altivec_put_h264_chroma_mc8_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
53 altivec_avg_h264_chroma_mc8_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
54 altivec_put_h264_qpel16_h_lowpass_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
55 altivec_avg_h264_qpel16_h_lowpass_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
56 altivec_put_h264_qpel16_v_lowpass_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
57 altivec_avg_h264_qpel16_v_lowpass_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
58 altivec_put_h264_qpel16_hv_lowpass_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
59 altivec_avg_h264_qpel16_hv_lowpass_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
60 powerpc_perf_total
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
61 };
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
62 enum powerpc_data_index {
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
63 powerpc_data_min = 0,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
64 powerpc_data_max,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
65 powerpc_data_sum,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
66 powerpc_data_num,
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
67 powerpc_data_total
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
68 };
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
69 extern unsigned long long perfdata[POWERPC_NUM_PMC_ENABLED][powerpc_perf_total][powerpc_data_total];
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
70
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
71 #ifndef POWERPC_MODE_64BITS
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
72 #define POWERP_PMC_DATATYPE unsigned long
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
73 #define POWERPC_GET_PMC1(a) asm volatile("mfspr %0, 937" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
74 #define POWERPC_GET_PMC2(a) asm volatile("mfspr %0, 938" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
75 #if (POWERPC_NUM_PMC_ENABLED > 2)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
76 #define POWERPC_GET_PMC3(a) asm volatile("mfspr %0, 941" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
77 #define POWERPC_GET_PMC4(a) asm volatile("mfspr %0, 942" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
78 #else
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
79 #define POWERPC_GET_PMC3(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
80 #define POWERPC_GET_PMC4(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
81 #endif
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
82 #if (POWERPC_NUM_PMC_ENABLED > 4)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
83 #define POWERPC_GET_PMC5(a) asm volatile("mfspr %0, 929" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
84 #define POWERPC_GET_PMC6(a) asm volatile("mfspr %0, 930" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
85 #else
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
86 #define POWERPC_GET_PMC5(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
87 #define POWERPC_GET_PMC6(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
88 #endif
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
89 #else /* POWERPC_MODE_64BITS */
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
90 #define POWERP_PMC_DATATYPE unsigned long long
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
91 #define POWERPC_GET_PMC1(a) asm volatile("mfspr %0, 771" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
92 #define POWERPC_GET_PMC2(a) asm volatile("mfspr %0, 772" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
93 #if (POWERPC_NUM_PMC_ENABLED > 2)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
94 #define POWERPC_GET_PMC3(a) asm volatile("mfspr %0, 773" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
95 #define POWERPC_GET_PMC4(a) asm volatile("mfspr %0, 774" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
96 #else
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
97 #define POWERPC_GET_PMC3(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
98 #define POWERPC_GET_PMC4(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
99 #endif
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
100 #if (POWERPC_NUM_PMC_ENABLED > 4)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
101 #define POWERPC_GET_PMC5(a) asm volatile("mfspr %0, 775" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
102 #define POWERPC_GET_PMC6(a) asm volatile("mfspr %0, 776" : "=r" (a))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
103 #else
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
104 #define POWERPC_GET_PMC5(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
105 #define POWERPC_GET_PMC6(a) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
106 #endif
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
107 #endif /* POWERPC_MODE_64BITS */
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
108 #define POWERPC_PERF_DECLARE(a, cond) \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
109 POWERP_PMC_DATATYPE \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
110 pmc_start[POWERPC_NUM_PMC_ENABLED], \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
111 pmc_stop[POWERPC_NUM_PMC_ENABLED], \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
112 pmc_loop_index;
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
113 #define POWERPC_PERF_START_COUNT(a, cond) do { \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
114 POWERPC_GET_PMC6(pmc_start[5]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
115 POWERPC_GET_PMC5(pmc_start[4]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
116 POWERPC_GET_PMC4(pmc_start[3]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
117 POWERPC_GET_PMC3(pmc_start[2]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
118 POWERPC_GET_PMC2(pmc_start[1]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
119 POWERPC_GET_PMC1(pmc_start[0]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
120 } while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
121 #define POWERPC_PERF_STOP_COUNT(a, cond) do { \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
122 POWERPC_GET_PMC1(pmc_stop[0]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
123 POWERPC_GET_PMC2(pmc_stop[1]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
124 POWERPC_GET_PMC3(pmc_stop[2]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
125 POWERPC_GET_PMC4(pmc_stop[3]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
126 POWERPC_GET_PMC5(pmc_stop[4]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
127 POWERPC_GET_PMC6(pmc_stop[5]); \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
128 if (cond) \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
129 { \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
130 for(pmc_loop_index = 0; \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
131 pmc_loop_index < POWERPC_NUM_PMC_ENABLED; \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
132 pmc_loop_index++) \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
133 { \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
134 if (pmc_stop[pmc_loop_index] >= pmc_start[pmc_loop_index]) \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
135 { \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
136 POWERP_PMC_DATATYPE diff = \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
137 pmc_stop[pmc_loop_index] - pmc_start[pmc_loop_index]; \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
138 if (diff < perfdata[pmc_loop_index][a][powerpc_data_min]) \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
139 perfdata[pmc_loop_index][a][powerpc_data_min] = diff; \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
140 if (diff > perfdata[pmc_loop_index][a][powerpc_data_max]) \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
141 perfdata[pmc_loop_index][a][powerpc_data_max] = diff; \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
142 perfdata[pmc_loop_index][a][powerpc_data_sum] += diff; \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
143 perfdata[pmc_loop_index][a][powerpc_data_num] ++; \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
144 } \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
145 } \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
146 } \
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
147 } while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
148 #else /* POWERPC_PERFORMANCE_REPORT */
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
149 // These no-op definitions are needed to avoid empty statements.
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
150 #define POWERPC_PERF_DECLARE(a, cond) int altivec_placeholder __attribute__ ((unused))
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
151 #define POWERPC_PERF_START_COUNT(a, cond) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
152 #define POWERPC_PERF_STOP_COUNT(a, cond) do {} while (0)
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
153 #endif /* POWERPC_PERFORMANCE_REPORT */
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
154
e8776388b02a [svn] - add ffmpeg
nenolod
parents:
diff changeset
155 #endif /* _DSPUTIL_PPC_ */