Mercurial > libavcodec.hg
annotate imgresample.c @ 2064:b77fe059dd09 libavcodec
fix normalization
| author | michael |
|---|---|
| date | Sun, 06 Jun 2004 20:15:53 +0000 |
| parents | 37ca6f8677de |
| children | 3dc9bbe1b152 |
| rev | line source |
|---|---|
| 0 | 1 /* |
| 2 * High quality image resampling with polyphase filters | |
| 429 | 3 * Copyright (c) 2001 Fabrice Bellard. |
| 0 | 4 * |
| 429 | 5 * This library is free software; you can redistribute it and/or |
| 6 * modify it under the terms of the GNU Lesser General Public | |
| 7 * License as published by the Free Software Foundation; either | |
| 8 * version 2 of the License, or (at your option) any later version. | |
| 0 | 9 * |
| 429 | 10 * This library is distributed in the hope that it will be useful, |
| 0 | 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 429 | 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 13 * Lesser General Public License for more details. | |
| 0 | 14 * |
| 429 | 15 * You should have received a copy of the GNU Lesser General Public |
| 16 * License along with this library; if not, write to the Free Software | |
| 17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA | |
| 0 | 18 */ |
| 1106 | 19 |
| 20 /** | |
| 21 * @file imgresample.c | |
| 22 * High quality image resampling with polyphase filters. | |
| 23 */ | |
| 24 | |
|
396
fce0a2520551
removed useless header includes - use av memory functions
glantau
parents:
18
diff
changeset
|
25 #include "avcodec.h" |
| 0 | 26 #include "dsputil.h" |
| 27 | |
| 17 | 28 #ifdef USE_FASTMEMCPY |
| 29 #include "fastmemcpy.h" | |
| 30 #endif | |
| 31 | |
| 0 | 32 #define NB_COMPONENTS 3 |
| 33 | |
| 34 #define PHASE_BITS 4 | |
| 35 #define NB_PHASES (1 << PHASE_BITS) | |
| 36 #define NB_TAPS 4 | |
| 37 #define FCENTER 1 /* index of the center of the filter */ | |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
38 //#define TEST 1 /* Test it */ |
| 0 | 39 |
| 40 #define POS_FRAC_BITS 16 | |
| 41 #define POS_FRAC (1 << POS_FRAC_BITS) | |
| 42 /* 6 bits precision is needed for MMX */ | |
| 43 #define FILTER_BITS 8 | |
| 44 | |
| 45 #define LINE_BUF_HEIGHT (NB_TAPS * 4) | |
| 46 | |
| 47 struct ImgReSampleContext { | |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
48 int iwidth, iheight, owidth, oheight; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
49 int topBand, bottomBand, leftBand, rightBand; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
50 int padtop, padbottom, padleft, padright; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
51 int pad_owidth, pad_oheight; |
| 0 | 52 int h_incr, v_incr; |
| 1064 | 53 int16_t h_filters[NB_PHASES][NB_TAPS] __align8; /* horizontal filters */ |
| 54 int16_t v_filters[NB_PHASES][NB_TAPS] __align8; /* vertical filters */ | |
| 55 uint8_t *line_buf; | |
| 0 | 56 }; |
| 57 | |
| 58 static inline int get_phase(int pos) | |
| 59 { | |
| 60 return ((pos) >> (POS_FRAC_BITS - PHASE_BITS)) & ((1 << PHASE_BITS) - 1); | |
| 61 } | |
| 62 | |
| 63 /* This function must be optimized */ | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
64 static void h_resample_fast(uint8_t *dst, int dst_width, const uint8_t *src, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
65 int src_width, int src_start, int src_incr, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
66 int16_t *filters) |
| 0 | 67 { |
| 68 int src_pos, phase, sum, i; | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
69 const uint8_t *s; |
| 1064 | 70 int16_t *filter; |
| 0 | 71 |
| 72 src_pos = src_start; | |
| 73 for(i=0;i<dst_width;i++) { | |
| 74 #ifdef TEST | |
| 75 /* test */ | |
| 76 if ((src_pos >> POS_FRAC_BITS) < 0 || | |
| 77 (src_pos >> POS_FRAC_BITS) > (src_width - NB_TAPS)) | |
| 653 | 78 av_abort(); |
| 0 | 79 #endif |
| 80 s = src + (src_pos >> POS_FRAC_BITS); | |
| 81 phase = get_phase(src_pos); | |
| 82 filter = filters + phase * NB_TAPS; | |
| 83 #if NB_TAPS == 4 | |
| 84 sum = s[0] * filter[0] + | |
| 85 s[1] * filter[1] + | |
| 86 s[2] * filter[2] + | |
| 87 s[3] * filter[3]; | |
| 88 #else | |
| 89 { | |
| 90 int j; | |
| 91 sum = 0; | |
| 92 for(j=0;j<NB_TAPS;j++) | |
| 93 sum += s[j] * filter[j]; | |
| 94 } | |
| 95 #endif | |
| 96 sum = sum >> FILTER_BITS; | |
| 97 if (sum < 0) | |
| 98 sum = 0; | |
| 99 else if (sum > 255) | |
| 100 sum = 255; | |
| 101 dst[0] = sum; | |
| 102 src_pos += src_incr; | |
| 103 dst++; | |
| 104 } | |
| 105 } | |
| 106 | |
| 107 /* This function must be optimized */ | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
108 static void v_resample(uint8_t *dst, int dst_width, const uint8_t *src, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
109 int wrap, int16_t *filter) |
| 0 | 110 { |
| 111 int sum, i; | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
112 const uint8_t *s; |
| 0 | 113 |
| 114 s = src; | |
| 115 for(i=0;i<dst_width;i++) { | |
| 116 #if NB_TAPS == 4 | |
| 117 sum = s[0 * wrap] * filter[0] + | |
| 118 s[1 * wrap] * filter[1] + | |
| 119 s[2 * wrap] * filter[2] + | |
| 120 s[3 * wrap] * filter[3]; | |
| 121 #else | |
| 122 { | |
| 123 int j; | |
| 1064 | 124 uint8_t *s1 = s; |
| 0 | 125 |
| 126 sum = 0; | |
| 127 for(j=0;j<NB_TAPS;j++) { | |
| 128 sum += s1[0] * filter[j]; | |
| 129 s1 += wrap; | |
| 130 } | |
| 131 } | |
| 132 #endif | |
| 133 sum = sum >> FILTER_BITS; | |
| 134 if (sum < 0) | |
| 135 sum = 0; | |
| 136 else if (sum > 255) | |
| 137 sum = 255; | |
| 138 dst[0] = sum; | |
| 139 dst++; | |
| 140 s++; | |
| 141 } | |
| 142 } | |
| 143 | |
| 2 | 144 #ifdef HAVE_MMX |
| 0 | 145 |
| 146 #include "i386/mmx.h" | |
| 147 | |
/*
 * Compute one horizontally filtered sample and leave it in the low dword of
 * MMX register reg.
 *
 * Relies on these names from the enclosing function: src, filters, src_incr
 * (inputs), src_pos (advanced by src_incr) and s, phase, filter (scratch).
 * mm7 must be zero on entry (it is used to widen bytes to words) and mm6 is
 * clobbered.
 *
 * Wrapped in do { } while (0) so that "FILTER4(r);" is a single statement
 * and is safe inside an unbraced if/else.
 */
#define FILTER4(reg) \
do {\
    s = src + (src_pos >> POS_FRAC_BITS);\
    phase = get_phase(src_pos);\
    filter = filters + phase * NB_TAPS;\
    movq_m2r(*s, reg);\
    punpcklbw_r2r(mm7, reg);          /* low 4 bytes -> 4 words */\
    movq_m2r(*filter, mm6);\
    pmaddwd_r2r(reg, mm6);            /* two partial sums as dwords */\
    movq_r2r(mm6, reg);\
    psrlq_i2r(32, reg);\
    paddd_r2r(mm6, reg);              /* low dword = sum of all 4 products */\
    psrad_i2r(FILTER_BITS, reg);\
    src_pos += src_incr;\
} while (0)
| 163 | |
/*
 * Debug helper: print the contents of MMX register reg as 16 hex digits.
 * Needs an mmx_t variable named tmp in scope. Expands to two statements, so
 * do not use it as the body of an unbraced if/else.
 * The value is cast to unsigned long long so that it matches the standard
 * "ll" length modifier ("L" is only defined for long double conversions).
 */
#define DUMP(reg) movq_r2m(reg, tmp); printf(#reg "=%016llx\n", (unsigned long long)tmp.uq);
| 165 | |
| 166 /* XXX: do four pixels at a time */ | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
167 static void h_resample_fast4_mmx(uint8_t *dst, int dst_width, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
168 const uint8_t *src, int src_width, |
| 1064 | 169 int src_start, int src_incr, int16_t *filters) |
| 0 | 170 { |
| 171 int src_pos, phase; | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
172 const uint8_t *s; |
| 1064 | 173 int16_t *filter; |
| 0 | 174 mmx_t tmp; |
| 175 | |
| 176 src_pos = src_start; | |
| 177 pxor_r2r(mm7, mm7); | |
| 178 | |
| 179 while (dst_width >= 4) { | |
| 180 | |
| 181 FILTER4(mm0); | |
| 182 FILTER4(mm1); | |
| 183 FILTER4(mm2); | |
| 184 FILTER4(mm3); | |
| 185 | |
| 186 packuswb_r2r(mm7, mm0); | |
| 187 packuswb_r2r(mm7, mm1); | |
| 188 packuswb_r2r(mm7, mm3); | |
| 189 packuswb_r2r(mm7, mm2); | |
| 190 movq_r2m(mm0, tmp); | |
| 191 dst[0] = tmp.ub[0]; | |
| 192 movq_r2m(mm1, tmp); | |
| 193 dst[1] = tmp.ub[0]; | |
| 194 movq_r2m(mm2, tmp); | |
| 195 dst[2] = tmp.ub[0]; | |
| 196 movq_r2m(mm3, tmp); | |
| 197 dst[3] = tmp.ub[0]; | |
| 198 dst += 4; | |
| 199 dst_width -= 4; | |
| 200 } | |
| 201 while (dst_width > 0) { | |
| 202 FILTER4(mm0); | |
| 203 packuswb_r2r(mm7, mm0); | |
| 204 movq_r2m(mm0, tmp); | |
| 205 dst[0] = tmp.ub[0]; | |
| 206 dst++; | |
| 207 dst_width--; | |
| 208 } | |
| 209 emms(); | |
| 210 } | |
| 211 | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
212 static void v_resample4_mmx(uint8_t *dst, int dst_width, const uint8_t *src, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
213 int wrap, int16_t *filter) |
| 0 | 214 { |
| 215 int sum, i, v; | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
216 const uint8_t *s; |
| 0 | 217 mmx_t tmp; |
| 218 mmx_t coefs[4]; | |
| 219 | |
| 220 for(i=0;i<4;i++) { | |
| 221 v = filter[i]; | |
| 222 coefs[i].uw[0] = v; | |
| 223 coefs[i].uw[1] = v; | |
| 224 coefs[i].uw[2] = v; | |
| 225 coefs[i].uw[3] = v; | |
| 226 } | |
| 227 | |
| 228 pxor_r2r(mm7, mm7); | |
| 229 s = src; | |
| 230 while (dst_width >= 4) { | |
| 231 movq_m2r(s[0 * wrap], mm0); | |
| 232 punpcklbw_r2r(mm7, mm0); | |
| 233 movq_m2r(s[1 * wrap], mm1); | |
| 234 punpcklbw_r2r(mm7, mm1); | |
| 235 movq_m2r(s[2 * wrap], mm2); | |
| 236 punpcklbw_r2r(mm7, mm2); | |
| 237 movq_m2r(s[3 * wrap], mm3); | |
| 238 punpcklbw_r2r(mm7, mm3); | |
| 239 | |
| 240 pmullw_m2r(coefs[0], mm0); | |
| 241 pmullw_m2r(coefs[1], mm1); | |
| 242 pmullw_m2r(coefs[2], mm2); | |
| 243 pmullw_m2r(coefs[3], mm3); | |
| 244 | |
| 245 paddw_r2r(mm1, mm0); | |
| 246 paddw_r2r(mm3, mm2); | |
| 247 paddw_r2r(mm2, mm0); | |
| 248 psraw_i2r(FILTER_BITS, mm0); | |
| 249 | |
| 250 packuswb_r2r(mm7, mm0); | |
| 251 movq_r2m(mm0, tmp); | |
| 252 | |
| 1064 | 253 *(uint32_t *)dst = tmp.ud[0]; |
| 0 | 254 dst += 4; |
| 255 s += 4; | |
| 256 dst_width -= 4; | |
| 257 } | |
| 258 while (dst_width > 0) { | |
| 259 sum = s[0 * wrap] * filter[0] + | |
| 260 s[1 * wrap] * filter[1] + | |
| 261 s[2 * wrap] * filter[2] + | |
| 262 s[3 * wrap] * filter[3]; | |
| 263 sum = sum >> FILTER_BITS; | |
| 264 if (sum < 0) | |
| 265 sum = 0; | |
| 266 else if (sum > 255) | |
| 267 sum = 255; | |
| 268 dst[0] = sum; | |
| 269 dst++; | |
| 270 s++; | |
| 271 dst_width--; | |
| 272 } | |
| 273 emms(); | |
| 274 } | |
| 275 #endif | |
| 276 | |
|
894
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
277 #ifdef HAVE_ALTIVEC |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
278 typedef union { |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
279 vector unsigned char v; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
280 unsigned char c[16]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
281 } vec_uc_t; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
282 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
283 typedef union { |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
284 vector signed short v; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
285 signed short s[8]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
286 } vec_ss_t; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
287 |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
288 void v_resample16_altivec(uint8_t *dst, int dst_width, const uint8_t *src, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
289 int wrap, int16_t *filter) |
|
894
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
290 { |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
291 int sum, i; |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
292 const uint8_t *s; |
|
894
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
293 vector unsigned char *tv, tmp, dstv, zero; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
294 vec_ss_t srchv[4], srclv[4], fv[4]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
295 vector signed short zeros, sumhv, sumlv; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
296 s = src; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
297 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
298 for(i=0;i<4;i++) |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
299 { |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
300 /* |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
301 The vec_madds later on does an implicit >>15 on the result. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
302 Since FILTER_BITS is 8, and we have 15 bits of magnitude in |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
303 a signed short, we have just enough bits to pre-shift our |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
304 filter constants <<7 to compensate for vec_madds. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
305 */ |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
306 fv[i].s[0] = filter[i] << (15-FILTER_BITS); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
307 fv[i].v = vec_splat(fv[i].v, 0); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
308 } |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
309 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
310 zero = vec_splat_u8(0); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
311 zeros = vec_splat_s16(0); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
312 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
313 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
314 /* |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
315 When we're resampling, we'd ideally like both our input buffers, |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
316 and output buffers to be 16-byte aligned, so we can do both aligned |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
317 reads and writes. Sadly we can't always have this at the moment, so |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
318 we opt for aligned writes, as unaligned writes have a huge overhead. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
319 To do this, do enough scalar resamples to get dst 16-byte aligned. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
320 */ |
|
898
6d5e3fe7aea1
Simplify an expression and eliminate a compile warning
philipjsg
parents:
894
diff
changeset
|
321 i = (-(int)dst) & 0xf; |
|
894
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
322 while(i>0) { |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
323 sum = s[0 * wrap] * filter[0] + |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
324 s[1 * wrap] * filter[1] + |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
325 s[2 * wrap] * filter[2] + |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
326 s[3 * wrap] * filter[3]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
327 sum = sum >> FILTER_BITS; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
328 if (sum<0) sum = 0; else if (sum>255) sum=255; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
329 dst[0] = sum; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
330 dst++; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
331 s++; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
332 dst_width--; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
333 i--; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
334 } |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
335 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
336 /* Do our altivec resampling on 16 pixels at once. */ |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
337 while(dst_width>=16) { |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
338 /* |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
339 Read 16 (potentially unaligned) bytes from each of |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
340 4 lines into 4 vectors, and split them into shorts. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
341 Interleave the multipy/accumulate for the resample |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
342 filter with the loads to hide the 3 cycle latency |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
343 the vec_madds have. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
344 */ |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
345 tv = (vector unsigned char *) &s[0 * wrap]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
346 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[i * wrap])); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
347 srchv[0].v = (vector signed short) vec_mergeh(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
348 srclv[0].v = (vector signed short) vec_mergel(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
349 sumhv = vec_madds(srchv[0].v, fv[0].v, zeros); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
350 sumlv = vec_madds(srclv[0].v, fv[0].v, zeros); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
351 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
352 tv = (vector unsigned char *) &s[1 * wrap]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
353 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[1 * wrap])); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
354 srchv[1].v = (vector signed short) vec_mergeh(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
355 srclv[1].v = (vector signed short) vec_mergel(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
356 sumhv = vec_madds(srchv[1].v, fv[1].v, sumhv); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
357 sumlv = vec_madds(srclv[1].v, fv[1].v, sumlv); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
358 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
359 tv = (vector unsigned char *) &s[2 * wrap]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
360 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[2 * wrap])); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
361 srchv[2].v = (vector signed short) vec_mergeh(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
362 srclv[2].v = (vector signed short) vec_mergel(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
363 sumhv = vec_madds(srchv[2].v, fv[2].v, sumhv); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
364 sumlv = vec_madds(srclv[2].v, fv[2].v, sumlv); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
365 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
366 tv = (vector unsigned char *) &s[3 * wrap]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
367 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[3 * wrap])); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
368 srchv[3].v = (vector signed short) vec_mergeh(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
369 srclv[3].v = (vector signed short) vec_mergel(zero, tmp); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
370 sumhv = vec_madds(srchv[3].v, fv[3].v, sumhv); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
371 sumlv = vec_madds(srclv[3].v, fv[3].v, sumlv); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
372 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
373 /* |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
374 Pack the results into our destination vector, |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
375 and do an aligned write of that back to memory. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
376 */ |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
377 dstv = vec_packsu(sumhv, sumlv) ; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
378 vec_st(dstv, 0, (vector unsigned char *) dst); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
379 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
380 dst+=16; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
381 s+=16; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
382 dst_width-=16; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
383 } |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
384 |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
385 /* |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
386 If there are any leftover pixels, resample them |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
387 with the slow scalar method. |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
388 */ |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
389 while(dst_width>0) { |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
390 sum = s[0 * wrap] * filter[0] + |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
391 s[1 * wrap] * filter[1] + |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
392 s[2 * wrap] * filter[2] + |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
393 s[3 * wrap] * filter[3]; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
394 sum = sum >> FILTER_BITS; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
395 if (sum<0) sum = 0; else if (sum>255) sum=255; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
396 dst[0] = sum; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
397 dst++; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
398 s++; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
399 dst_width--; |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
400 } |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
401 } |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
402 #endif |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
403 |
| 0 | 404 /* slow version to handle limit cases. Does not need optimisation */ |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
405 static void h_resample_slow(uint8_t *dst, int dst_width, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
406 const uint8_t *src, int src_width, |
| 1064 | 407 int src_start, int src_incr, int16_t *filters) |
| 0 | 408 { |
| 409 int src_pos, phase, sum, j, v, i; | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
410 const uint8_t *s, *src_end; |
| 1064 | 411 int16_t *filter; |
| 0 | 412 |
| 413 src_end = src + src_width; | |
| 414 src_pos = src_start; | |
| 415 for(i=0;i<dst_width;i++) { | |
| 416 s = src + (src_pos >> POS_FRAC_BITS); | |
| 417 phase = get_phase(src_pos); | |
| 418 filter = filters + phase * NB_TAPS; | |
| 419 sum = 0; | |
| 420 for(j=0;j<NB_TAPS;j++) { | |
| 421 if (s < src) | |
| 422 v = src[0]; | |
| 423 else if (s >= src_end) | |
| 424 v = src_end[-1]; | |
| 425 else | |
| 426 v = s[0]; | |
| 427 sum += v * filter[j]; | |
| 428 s++; | |
| 429 } | |
| 430 sum = sum >> FILTER_BITS; | |
| 431 if (sum < 0) | |
| 432 sum = 0; | |
| 433 else if (sum > 255) | |
| 434 sum = 255; | |
| 435 dst[0] = sum; | |
| 436 src_pos += src_incr; | |
| 437 dst++; | |
| 438 } | |
| 439 } | |
| 440 | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
441 static void h_resample(uint8_t *dst, int dst_width, const uint8_t *src, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
442 int src_width, int src_start, int src_incr, |
|
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
443 int16_t *filters) |
| 0 | 444 { |
| 445 int n, src_end; | |
| 446 | |
| 447 if (src_start < 0) { | |
| 448 n = (0 - src_start + src_incr - 1) / src_incr; | |
| 449 h_resample_slow(dst, n, src, src_width, src_start, src_incr, filters); | |
| 450 dst += n; | |
| 451 dst_width -= n; | |
| 452 src_start += n * src_incr; | |
| 453 } | |
| 454 src_end = src_start + dst_width * src_incr; | |
| 455 if (src_end > ((src_width - NB_TAPS) << POS_FRAC_BITS)) { | |
| 456 n = (((src_width - NB_TAPS + 1) << POS_FRAC_BITS) - 1 - src_start) / | |
| 457 src_incr; | |
| 458 } else { | |
| 459 n = dst_width; | |
| 460 } | |
| 2 | 461 #ifdef HAVE_MMX |
| 0 | 462 if ((mm_flags & MM_MMX) && NB_TAPS == 4) |
| 463 h_resample_fast4_mmx(dst, n, | |
| 464 src, src_width, src_start, src_incr, filters); | |
| 465 else | |
| 466 #endif | |
| 467 h_resample_fast(dst, n, | |
| 468 src, src_width, src_start, src_incr, filters); | |
| 469 if (n < dst_width) { | |
| 470 dst += n; | |
| 471 dst_width -= n; | |
| 472 src_start += n * src_incr; | |
| 473 h_resample_slow(dst, dst_width, | |
| 474 src, src_width, src_start, src_incr, filters); | |
| 475 } | |
| 476 } | |
| 477 | |
| 478 static void component_resample(ImgReSampleContext *s, | |
| 1064 | 479 uint8_t *output, int owrap, int owidth, int oheight, |
| 480 uint8_t *input, int iwrap, int iwidth, int iheight) | |
| 0 | 481 { |
| 482 int src_y, src_y1, last_src_y, ring_y, phase_y, y1, y; | |
| 1064 | 483 uint8_t *new_line, *src_line; |
| 0 | 484 |
| 485 last_src_y = - FCENTER - 1; | |
| 486 /* position of the bottom of the filter in the source image */ | |
| 487 src_y = (last_src_y + NB_TAPS) * POS_FRAC; | |
| 488 ring_y = NB_TAPS; /* position in ring buffer */ | |
| 489 for(y=0;y<oheight;y++) { | |
| 490 /* apply horizontal filter on new lines from input if needed */ | |
| 491 src_y1 = src_y >> POS_FRAC_BITS; | |
| 492 while (last_src_y < src_y1) { | |
| 493 if (++ring_y >= LINE_BUF_HEIGHT + NB_TAPS) | |
| 494 ring_y = NB_TAPS; | |
| 495 last_src_y++; | |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
496 /* handle limit conditions : replicate line (slightly |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
497 inefficient because we filter multiple times) */ |
| 0 | 498 y1 = last_src_y; |
| 499 if (y1 < 0) { | |
| 500 y1 = 0; | |
| 501 } else if (y1 >= iheight) { | |
| 502 y1 = iheight - 1; | |
| 503 } | |
| 504 src_line = input + y1 * iwrap; | |
| 505 new_line = s->line_buf + ring_y * owidth; | |
| 506 /* apply filter and handle limit cases correctly */ | |
| 507 h_resample(new_line, owidth, | |
| 508 src_line, iwidth, - FCENTER * POS_FRAC, s->h_incr, | |
| 509 &s->h_filters[0][0]); | |
| 510 /* handle ring buffer wraping */ | |
| 511 if (ring_y >= LINE_BUF_HEIGHT) { | |
| 512 memcpy(s->line_buf + (ring_y - LINE_BUF_HEIGHT) * owidth, | |
| 513 new_line, owidth); | |
| 514 } | |
| 515 } | |
| 516 /* apply vertical filter */ | |
| 517 phase_y = get_phase(src_y); | |
| 2 | 518 #ifdef HAVE_MMX |
| 0 | 519 /* desactivated MMX because loss of precision */ |
| 520 if ((mm_flags & MM_MMX) && NB_TAPS == 4 && 0) | |
| 521 v_resample4_mmx(output, owidth, | |
| 522 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth, | |
| 523 &s->v_filters[phase_y][0]); | |
| 524 else | |
| 525 #endif | |
|
894
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
526 #ifdef HAVE_ALTIVEC |
|
920
a0ad8e3452f2
practically disabling altivec resampling code (some ppl said its broken) patch by (Dieter Shirley <dieters at schemasoft dot com>)
michaelni
parents:
898
diff
changeset
|
527 if ((mm_flags & MM_ALTIVEC) && NB_TAPS == 4 && FILTER_BITS <= 6) |
|
894
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
528 v_resample16_altivec(output, owidth, |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
529 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth, |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
530 &s->v_filters[phase_y][0]); |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
531 else |
|
a408778eff87
altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents:
653
diff
changeset
|
532 #endif |
| 0 | 533 v_resample(output, owidth, |
| 534 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth, | |
| 535 &s->v_filters[phase_y][0]); | |
| 536 | |
| 537 src_y += s->v_incr; | |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
538 |
| 0 | 539 output += owrap; |
| 540 } | |
| 541 } | |
| 542 | |
| 543 /* XXX: the following filter is quite naive, but it seems to suffice | |
| 544 for 4 taps */ | |
| 1064 | 545 static void build_filter(int16_t *filter, float factor) |
| 0 | 546 { |
| 547 int ph, i, v; | |
| 2064 | 548 float x, y, tab[NB_TAPS], norm, mult, target; |
| 0 | 549 |
| 550 /* if upsampling, only need to interpolate, no filter */ | |
| 551 if (factor > 1.0) | |
| 552 factor = 1.0; | |
| 553 | |
| 554 for(ph=0;ph<NB_PHASES;ph++) { | |
| 555 norm = 0; | |
| 556 for(i=0;i<NB_TAPS;i++) { | |
| 2062 | 557 #if 1 |
| 558 const float d= -0.5; //first order derivative = -0.5 | |
| 559 x = fabs(((float)(i - FCENTER) - (float)ph / NB_PHASES) * factor); | |
| 560 if(x<1.0) y= 1 - 3*x*x + 2*x*x*x + d*( -x*x + x*x*x); | |
| 561 else y= d*(-4 + 8*x - 5*x*x + x*x*x); | |
| 562 #else | |
| 0 | 563 x = M_PI * ((float)(i - FCENTER) - (float)ph / NB_PHASES) * factor; |
| 564 if (x == 0) | |
| 565 y = 1.0; | |
| 566 else | |
| 567 y = sin(x) / x; | |
| 2062 | 568 #endif |
| 0 | 569 tab[i] = y; |
| 570 norm += y; | |
| 571 } | |
| 572 | |
| 573 /* normalize so that an uniform color remains the same */ | |
| 2064 | 574 target= 1 << FILTER_BITS; |
| 0 | 575 for(i=0;i<NB_TAPS;i++) { |
| 2064 | 576 mult = target / norm; |
| 577 v = lrintf(tab[i] * mult); | |
| 0 | 578 filter[ph * NB_TAPS + i] = v; |
| 2064 | 579 norm -= tab[i]; |
| 580 target -= v; | |
| 0 | 581 } |
| 582 } | |
| 583 } | |
| 584 | |
| 585 ImgReSampleContext *img_resample_init(int owidth, int oheight, | |
| 586 int iwidth, int iheight) | |
| 587 { | |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
588 return img_resample_full_init(owidth, oheight, iwidth, iheight, |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
589 0, 0, 0, 0, 0, 0, 0, 0); |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
590 } |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
591 |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
592 ImgReSampleContext *img_resample_full_init(int owidth, int oheight, |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
593 int iwidth, int iheight, |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
594 int topBand, int bottomBand, |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
595 int leftBand, int rightBand, |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
596 int padtop, int padbottom, |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
597 int padleft, int padright) |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
598 { |
| 0 | 599 ImgReSampleContext *s; |
| 600 | |
| 601 s = av_mallocz(sizeof(ImgReSampleContext)); | |
| 602 if (!s) | |
| 603 return NULL; | |
| 604 s->line_buf = av_mallocz(owidth * (LINE_BUF_HEIGHT + NB_TAPS)); | |
| 605 if (!s->line_buf) | |
| 606 goto fail; | |
| 607 | |
| 608 s->owidth = owidth; | |
| 609 s->oheight = oheight; | |
| 610 s->iwidth = iwidth; | |
| 611 s->iheight = iheight; | |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
612 |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
613 s->topBand = topBand; |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
614 s->bottomBand = bottomBand; |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
615 s->leftBand = leftBand; |
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
616 s->rightBand = rightBand; |
| 0 | 617 |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
618 s->padtop = padtop; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
619 s->padbottom = padbottom; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
620 s->padleft = padleft; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
621 s->padright = padright; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
622 |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
623 s->pad_owidth = owidth - (padleft + padright); |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
624 s->pad_oheight = oheight - (padtop + padbottom); |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
625 |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
626 s->h_incr = ((iwidth - leftBand - rightBand) * POS_FRAC) / s->pad_owidth; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
627 s->v_incr = ((iheight - topBand - bottomBand) * POS_FRAC) / s->pad_oheight; |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
628 |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
629 build_filter(&s->h_filters[0][0], (float) s->pad_owidth / |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
630 (float) (iwidth - leftBand - rightBand)); |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
631 build_filter(&s->v_filters[0][0], (float) s->pad_oheight / |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
632 (float) (iheight - topBand - bottomBand)); |
| 0 | 633 |
| 634 return s; | |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
635 fail: |
|
396
fce0a2520551
removed useless header includes - use av memory functions
glantau
parents:
18
diff
changeset
|
636 av_free(s); |
| 0 | 637 return NULL; |
| 638 } | |
| 639 | |
| 640 void img_resample(ImgReSampleContext *s, | |
|
1488
766a2f4edbea
avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents:
1106
diff
changeset
|
641 AVPicture *output, const AVPicture *input) |
| 0 | 642 { |
| 643 int i, shift; | |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
644 uint8_t* optr; |
| 0 | 645 |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
646 for (i=0;i<3;i++) { |
| 0 | 647 shift = (i == 0) ? 0 : 1; |
|
1928
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
648 |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
649 optr = output->data[i] + (((output->linesize[i] * |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
650 s->padtop) + s->padleft) >> shift); |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
651 |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
652 component_resample(s, optr, output->linesize[i], |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
653 s->pad_owidth >> shift, s->pad_oheight >> shift, |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
654 input->data[i] + (input->linesize[i] * |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
655 (s->topBand >> shift)) + (s->leftBand >> shift), |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
656 input->linesize[i], ((s->iwidth - s->leftBand - |
|
0c23a5564489
padding support in ffmpeg patch by (Todd Kirby <doubleshot at pacbell dot net>)
michael
parents:
1488
diff
changeset
|
657 s->rightBand) >> shift), |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
658 (s->iheight - s->topBand - s->bottomBand) >> shift); |
| 0 | 659 } |
| 660 } | |
| 661 | |
| 662 void img_resample_close(ImgReSampleContext *s) | |
| 663 { | |
|
396
fce0a2520551
removed useless header includes - use av memory functions
glantau
parents:
18
diff
changeset
|
664 av_free(s->line_buf); |
|
fce0a2520551
removed useless header includes - use av memory functions
glantau
parents:
18
diff
changeset
|
665 av_free(s); |
| 0 | 666 } |
| 667 | |
| 668 #ifdef TEST | |
| 669 | |
/**
 * Test-only stand-in for the library allocator: allocate size bytes of
 * zero-filled memory.
 *
 * @param size  number of bytes requested
 * @return the zeroed block, or NULL if size is negative or the allocation
 *         fails (the result is no longer written to before being checked)
 */
void *av_mallocz(int size)
{
    if (size < 0)
        return NULL;
    return calloc(1, (size_t)size);
}
| 677 | |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
/**
 * Test-only stand-in for the library deallocator.
 *
 * @param ptr  block obtained from av_mallocz(), or NULL; free() itself
 *             ignores NULL, so no explicit test is needed
 */
void av_free(void *ptr)
{
    free(ptr);
}
|
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
684 |
/* dimensions of the input test image and of the output buffers */
#define XSIZE 256
#define YSIZE 256
#define XSIZE1 512
#define YSIZE1 512

/* input: one byte per pixel */
uint8_t img[XSIZE * YSIZE];

/* output: two buffers so that two results can be compared */
uint8_t img1[XSIZE1 * YSIZE1];
uint8_t img2[XSIZE1 * YSIZE1];
| 0 | 695 |
/**
 * Write an 8-bit greyscale image as a binary PGM ("P5") file.
 *
 * The file is opened in binary mode so the pixel bytes are not translated
 * on platforms that distinguish text and binary streams. Failures to open
 * or write the file are reported on stderr instead of crashing.
 *
 * @param filename  path of the file to create
 * @param img       xsize * ysize pixels, row after row
 * @param xsize     image width in pixels
 * @param ysize     image height in pixels
 */
void save_pgm(const char *filename, uint8_t *img, int xsize, int ysize)
{
    const size_t count = (size_t)xsize * (size_t)ysize;
    int failed;
    FILE *f;

    f = fopen(filename, "wb");
    if (!f) {
        perror(filename);
        return;
    }
    failed = fprintf(f, "P5\n%d %d\n%d\n", xsize, ysize, 255) < 0;
    if (!failed)
        failed = fwrite(img, 1, count, f) != count;
    /* fclose() flushes, so its result matters for a file being written */
    if (fclose(f) != 0)
        failed = 1;
    if (failed)
        fprintf(stderr, "%s: write error\n", filename);
}
| 704 | |
| 1064 | 705 static void dump_filter(int16_t *filter) |
| 0 | 706 { |
| 707 int i, ph; | |
| 708 | |
| 709 for(ph=0;ph<NB_PHASES;ph++) { | |
| 710 printf("%2d: ", ph); | |
| 711 for(i=0;i<NB_TAPS;i++) { | |
| 712 printf(" %5.2f", filter[ph * NB_TAPS + i] / 256.0); | |
| 713 } | |
| 714 printf("\n"); | |
| 715 } | |
| 716 } | |
| 717 | |
| 2 | 718 #ifdef HAVE_MMX |
| 644 | 719 int mm_flags; |
| 0 | 720 #endif |
| 721 | |
| 722 int main(int argc, char **argv) | |
| 723 { | |
| 724 int x, y, v, i, xsize, ysize; | |
| 725 ImgReSampleContext *s; | |
| 726 float fact, factors[] = { 1/2.0, 3.0/4.0, 1.0, 4.0/3.0, 16.0/9.0, 2.0 }; | |
| 727 char buf[256]; | |
| 728 | |
| 729 /* build test image */ | |
| 730 for(y=0;y<YSIZE;y++) { | |
| 731 for(x=0;x<XSIZE;x++) { | |
| 732 if (x < XSIZE/2 && y < YSIZE/2) { | |
| 733 if (x < XSIZE/4 && y < YSIZE/4) { | |
| 734 if ((x % 10) <= 6 && | |
| 735 (y % 10) <= 6) | |
| 736 v = 0xff; | |
| 737 else | |
| 738 v = 0x00; | |
| 739 } else if (x < XSIZE/4) { | |
| 740 if (x & 1) | |
| 741 v = 0xff; | |
| 742 else | |
| 743 v = 0; | |
| 744 } else if (y < XSIZE/4) { | |
| 745 if (y & 1) | |
| 746 v = 0xff; | |
| 747 else | |
| 748 v = 0; | |
| 749 } else { | |
| 750 if (y < YSIZE*3/8) { | |
| 751 if ((y+x) & 1) | |
| 752 v = 0xff; | |
| 753 else | |
| 754 v = 0; | |
| 755 } else { | |
| 756 if (((x+3) % 4) <= 1 && | |
| 757 ((y+3) % 4) <= 1) | |
| 758 v = 0xff; | |
| 759 else | |
| 760 v = 0x00; | |
| 761 } | |
| 762 } | |
| 763 } else if (x < XSIZE/2) { | |
| 764 v = ((x - (XSIZE/2)) * 255) / (XSIZE/2); | |
| 765 } else if (y < XSIZE/2) { | |
| 766 v = ((y - (XSIZE/2)) * 255) / (XSIZE/2); | |
| 767 } else { | |
| 768 v = ((x + y - XSIZE) * 255) / XSIZE; | |
| 769 } | |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
770 img[(YSIZE - y) * XSIZE + (XSIZE - x)] = v; |
| 0 | 771 } |
| 772 } | |
| 773 save_pgm("/tmp/in.pgm", img, XSIZE, YSIZE); | |
| 774 for(i=0;i<sizeof(factors)/sizeof(float);i++) { | |
| 775 fact = factors[i]; | |
| 776 xsize = (int)(XSIZE * fact); | |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
777 ysize = (int)((YSIZE - 100) * fact); |
| 644 | 778 s = img_resample_full_init(xsize, ysize, XSIZE, YSIZE, 50 ,50, 0, 0); |
| 0 | 779 printf("Factor=%0.2f\n", fact); |
| 780 dump_filter(&s->h_filters[0][0]); | |
| 781 component_resample(s, img1, xsize, xsize, ysize, | |
|
630
b4ee42142ad1
croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents:
429
diff
changeset
|
782 img + 50 * XSIZE, XSIZE, XSIZE, YSIZE - 100); |
| 0 | 783 img_resample_close(s); |
| 784 | |
| 785 sprintf(buf, "/tmp/out%d.pgm", i); | |
| 786 save_pgm(buf, img1, xsize, ysize); | |
| 787 } | |
| 788 | |
| 789 /* mmx test */ | |
| 2 | 790 #ifdef HAVE_MMX |
| 0 | 791 printf("MMX test\n"); |
| 792 fact = 0.72; | |
| 793 xsize = (int)(XSIZE * fact); | |
| 794 ysize = (int)(YSIZE * fact); | |
| 795 mm_flags = MM_MMX; | |
| 796 s = img_resample_init(xsize, ysize, XSIZE, YSIZE); | |
| 797 component_resample(s, img1, xsize, xsize, ysize, | |
| 798 img, XSIZE, XSIZE, YSIZE); | |
| 799 | |
| 800 mm_flags = 0; | |
| 801 s = img_resample_init(xsize, ysize, XSIZE, YSIZE); | |
| 802 component_resample(s, img2, xsize, xsize, ysize, | |
| 803 img, XSIZE, XSIZE, YSIZE); | |
| 804 if (memcmp(img1, img2, xsize * ysize) != 0) { | |
| 805 fprintf(stderr, "mmx error\n"); | |
| 806 exit(1); | |
| 807 } | |
| 808 printf("MMX OK\n"); | |
| 809 #endif | |
| 810 return 0; | |
| 811 } | |
| 812 | |
| 813 #endif |
