annotate imgresample.c @ 1516:0f0e9dfa6723 libavcodec

theora decoding support (only keyframes for now, because by theora the frame isn't flipped so the motion vectors are getting screwed up)
author alex
date Sat, 11 Oct 2003 17:44:21 +0000
parents 766a2f4edbea
children 0c23a5564489
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
1 /*
986e461dc072 Initial revision
glantau
parents:
diff changeset
2 * High quality image resampling with polyphase filters
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
3 * Copyright (c) 2001 Fabrice Bellard.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
4 *
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
5 * This library is free software; you can redistribute it and/or
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
6 * modify it under the terms of the GNU Lesser General Public
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
7 * License as published by the Free Software Foundation; either
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
8 * version 2 of the License, or (at your option) any later version.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
9 *
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
10 * This library is distributed in the hope that it will be useful,
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
13 * Lesser General Public License for more details.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
14 *
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
15 * You should have received a copy of the GNU Lesser General Public
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
16 * License along with this library; if not, write to the Free Software
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
18 */
1106
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
19
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
20 /**
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
21 * @file imgresample.c
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
22 * High quality image resampling with polyphase filters .
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
23 */
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
24
396
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
25 #include "avcodec.h"
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
26 #include "dsputil.h"
986e461dc072 Initial revision
glantau
parents:
diff changeset
27
17
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
28 #ifdef USE_FASTMEMCPY
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
29 #include "fastmemcpy.h"
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
30 #endif
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
31
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
32 #define NB_COMPONENTS 3
986e461dc072 Initial revision
glantau
parents:
diff changeset
33
986e461dc072 Initial revision
glantau
parents:
diff changeset
34 #define PHASE_BITS 4
986e461dc072 Initial revision
glantau
parents:
diff changeset
35 #define NB_PHASES (1 << PHASE_BITS)
986e461dc072 Initial revision
glantau
parents:
diff changeset
36 #define NB_TAPS 4
986e461dc072 Initial revision
glantau
parents:
diff changeset
37 #define FCENTER 1 /* index of the center of the filter */
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
38 //#define TEST 1 /* Test it */
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
39
986e461dc072 Initial revision
glantau
parents:
diff changeset
40 #define POS_FRAC_BITS 16
986e461dc072 Initial revision
glantau
parents:
diff changeset
41 #define POS_FRAC (1 << POS_FRAC_BITS)
986e461dc072 Initial revision
glantau
parents:
diff changeset
42 /* 6 bits precision is needed for MMX */
986e461dc072 Initial revision
glantau
parents:
diff changeset
43 #define FILTER_BITS 8
986e461dc072 Initial revision
glantau
parents:
diff changeset
44
986e461dc072 Initial revision
glantau
parents:
diff changeset
45 #define LINE_BUF_HEIGHT (NB_TAPS * 4)
986e461dc072 Initial revision
glantau
parents:
diff changeset
46
986e461dc072 Initial revision
glantau
parents:
diff changeset
47 struct ImgReSampleContext {
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
48 int iwidth, iheight, owidth, oheight, topBand, bottomBand, leftBand, rightBand;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
49 int h_incr, v_incr;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
50 int16_t h_filters[NB_PHASES][NB_TAPS] __align8; /* horizontal filters */
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
51 int16_t v_filters[NB_PHASES][NB_TAPS] __align8; /* vertical filters */
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
52 uint8_t *line_buf;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
53 };
986e461dc072 Initial revision
glantau
parents:
diff changeset
54
986e461dc072 Initial revision
glantau
parents:
diff changeset
55 static inline int get_phase(int pos)
986e461dc072 Initial revision
glantau
parents:
diff changeset
56 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
57 return ((pos) >> (POS_FRAC_BITS - PHASE_BITS)) & ((1 << PHASE_BITS) - 1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
58 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
59
986e461dc072 Initial revision
glantau
parents:
diff changeset
60 /* This function must be optimized */
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
61 static void h_resample_fast(uint8_t *dst, int dst_width, const uint8_t *src,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
62 int src_width, int src_start, int src_incr,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
63 int16_t *filters)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
64 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
65 int src_pos, phase, sum, i;
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
66 const uint8_t *s;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
67 int16_t *filter;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
68
986e461dc072 Initial revision
glantau
parents:
diff changeset
69 src_pos = src_start;
986e461dc072 Initial revision
glantau
parents:
diff changeset
70 for(i=0;i<dst_width;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
71 #ifdef TEST
986e461dc072 Initial revision
glantau
parents:
diff changeset
72 /* test */
986e461dc072 Initial revision
glantau
parents:
diff changeset
73 if ((src_pos >> POS_FRAC_BITS) < 0 ||
986e461dc072 Initial revision
glantau
parents:
diff changeset
74 (src_pos >> POS_FRAC_BITS) > (src_width - NB_TAPS))
653
714795876872 Change abort() calls to av_abort() calls.
philipjsg
parents: 644
diff changeset
75 av_abort();
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
76 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
77 s = src + (src_pos >> POS_FRAC_BITS);
986e461dc072 Initial revision
glantau
parents:
diff changeset
78 phase = get_phase(src_pos);
986e461dc072 Initial revision
glantau
parents:
diff changeset
79 filter = filters + phase * NB_TAPS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
80 #if NB_TAPS == 4
986e461dc072 Initial revision
glantau
parents:
diff changeset
81 sum = s[0] * filter[0] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
82 s[1] * filter[1] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
83 s[2] * filter[2] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
84 s[3] * filter[3];
986e461dc072 Initial revision
glantau
parents:
diff changeset
85 #else
986e461dc072 Initial revision
glantau
parents:
diff changeset
86 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
87 int j;
986e461dc072 Initial revision
glantau
parents:
diff changeset
88 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
89 for(j=0;j<NB_TAPS;j++)
986e461dc072 Initial revision
glantau
parents:
diff changeset
90 sum += s[j] * filter[j];
986e461dc072 Initial revision
glantau
parents:
diff changeset
91 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
92 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
93 sum = sum >> FILTER_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
94 if (sum < 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
95 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
96 else if (sum > 255)
986e461dc072 Initial revision
glantau
parents:
diff changeset
97 sum = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
98 dst[0] = sum;
986e461dc072 Initial revision
glantau
parents:
diff changeset
99 src_pos += src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
100 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
101 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
102 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
103
986e461dc072 Initial revision
glantau
parents:
diff changeset
104 /* This function must be optimized */
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
105 static void v_resample(uint8_t *dst, int dst_width, const uint8_t *src,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
106 int wrap, int16_t *filter)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
107 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
108 int sum, i;
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
109 const uint8_t *s;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
110
986e461dc072 Initial revision
glantau
parents:
diff changeset
111 s = src;
986e461dc072 Initial revision
glantau
parents:
diff changeset
112 for(i=0;i<dst_width;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
113 #if NB_TAPS == 4
986e461dc072 Initial revision
glantau
parents:
diff changeset
114 sum = s[0 * wrap] * filter[0] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
115 s[1 * wrap] * filter[1] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
116 s[2 * wrap] * filter[2] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
117 s[3 * wrap] * filter[3];
986e461dc072 Initial revision
glantau
parents:
diff changeset
118 #else
986e461dc072 Initial revision
glantau
parents:
diff changeset
119 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
120 int j;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
121 uint8_t *s1 = s;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
122
986e461dc072 Initial revision
glantau
parents:
diff changeset
123 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
124 for(j=0;j<NB_TAPS;j++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
125 sum += s1[0] * filter[j];
986e461dc072 Initial revision
glantau
parents:
diff changeset
126 s1 += wrap;
986e461dc072 Initial revision
glantau
parents:
diff changeset
127 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
128 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
129 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
130 sum = sum >> FILTER_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
131 if (sum < 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
132 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
133 else if (sum > 255)
986e461dc072 Initial revision
glantau
parents:
diff changeset
134 sum = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
135 dst[0] = sum;
986e461dc072 Initial revision
glantau
parents:
diff changeset
136 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
137 s++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
138 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
139 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
140
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
141 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
142
986e461dc072 Initial revision
glantau
parents:
diff changeset
143 #include "i386/mmx.h"
986e461dc072 Initial revision
glantau
parents:
diff changeset
144
986e461dc072 Initial revision
glantau
parents:
diff changeset
145 #define FILTER4(reg) \
986e461dc072 Initial revision
glantau
parents:
diff changeset
146 {\
986e461dc072 Initial revision
glantau
parents:
diff changeset
147 s = src + (src_pos >> POS_FRAC_BITS);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
148 phase = get_phase(src_pos);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
149 filter = filters + phase * NB_TAPS;\
986e461dc072 Initial revision
glantau
parents:
diff changeset
150 movq_m2r(*s, reg);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
151 punpcklbw_r2r(mm7, reg);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
152 movq_m2r(*filter, mm6);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
153 pmaddwd_r2r(reg, mm6);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
154 movq_r2r(mm6, reg);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
155 psrlq_i2r(32, reg);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
156 paddd_r2r(mm6, reg);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
157 psrad_i2r(FILTER_BITS, reg);\
986e461dc072 Initial revision
glantau
parents:
diff changeset
158 src_pos += src_incr;\
986e461dc072 Initial revision
glantau
parents:
diff changeset
159 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
160
986e461dc072 Initial revision
glantau
parents:
diff changeset
161 #define DUMP(reg) movq_r2m(reg, tmp); printf(#reg "=%016Lx\n", tmp.uq);
986e461dc072 Initial revision
glantau
parents:
diff changeset
162
986e461dc072 Initial revision
glantau
parents:
diff changeset
163 /* XXX: do four pixels at a time */
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
164 static void h_resample_fast4_mmx(uint8_t *dst, int dst_width,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
165 const uint8_t *src, int src_width,
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
166 int src_start, int src_incr, int16_t *filters)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
167 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
168 int src_pos, phase;
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
169 const uint8_t *s;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
170 int16_t *filter;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
171 mmx_t tmp;
986e461dc072 Initial revision
glantau
parents:
diff changeset
172
986e461dc072 Initial revision
glantau
parents:
diff changeset
173 src_pos = src_start;
986e461dc072 Initial revision
glantau
parents:
diff changeset
174 pxor_r2r(mm7, mm7);
986e461dc072 Initial revision
glantau
parents:
diff changeset
175
986e461dc072 Initial revision
glantau
parents:
diff changeset
176 while (dst_width >= 4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
177
986e461dc072 Initial revision
glantau
parents:
diff changeset
178 FILTER4(mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
179 FILTER4(mm1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
180 FILTER4(mm2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
181 FILTER4(mm3);
986e461dc072 Initial revision
glantau
parents:
diff changeset
182
986e461dc072 Initial revision
glantau
parents:
diff changeset
183 packuswb_r2r(mm7, mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
184 packuswb_r2r(mm7, mm1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
185 packuswb_r2r(mm7, mm3);
986e461dc072 Initial revision
glantau
parents:
diff changeset
186 packuswb_r2r(mm7, mm2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
187 movq_r2m(mm0, tmp);
986e461dc072 Initial revision
glantau
parents:
diff changeset
188 dst[0] = tmp.ub[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
189 movq_r2m(mm1, tmp);
986e461dc072 Initial revision
glantau
parents:
diff changeset
190 dst[1] = tmp.ub[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
191 movq_r2m(mm2, tmp);
986e461dc072 Initial revision
glantau
parents:
diff changeset
192 dst[2] = tmp.ub[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
193 movq_r2m(mm3, tmp);
986e461dc072 Initial revision
glantau
parents:
diff changeset
194 dst[3] = tmp.ub[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
195 dst += 4;
986e461dc072 Initial revision
glantau
parents:
diff changeset
196 dst_width -= 4;
986e461dc072 Initial revision
glantau
parents:
diff changeset
197 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
198 while (dst_width > 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
199 FILTER4(mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
200 packuswb_r2r(mm7, mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
201 movq_r2m(mm0, tmp);
986e461dc072 Initial revision
glantau
parents:
diff changeset
202 dst[0] = tmp.ub[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
203 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
204 dst_width--;
986e461dc072 Initial revision
glantau
parents:
diff changeset
205 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
206 emms();
986e461dc072 Initial revision
glantau
parents:
diff changeset
207 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
208
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
209 static void v_resample4_mmx(uint8_t *dst, int dst_width, const uint8_t *src,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
210 int wrap, int16_t *filter)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
211 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
212 int sum, i, v;
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
213 const uint8_t *s;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
214 mmx_t tmp;
986e461dc072 Initial revision
glantau
parents:
diff changeset
215 mmx_t coefs[4];
986e461dc072 Initial revision
glantau
parents:
diff changeset
216
986e461dc072 Initial revision
glantau
parents:
diff changeset
217 for(i=0;i<4;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
218 v = filter[i];
986e461dc072 Initial revision
glantau
parents:
diff changeset
219 coefs[i].uw[0] = v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
220 coefs[i].uw[1] = v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
221 coefs[i].uw[2] = v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
222 coefs[i].uw[3] = v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
223 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
224
986e461dc072 Initial revision
glantau
parents:
diff changeset
225 pxor_r2r(mm7, mm7);
986e461dc072 Initial revision
glantau
parents:
diff changeset
226 s = src;
986e461dc072 Initial revision
glantau
parents:
diff changeset
227 while (dst_width >= 4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
228 movq_m2r(s[0 * wrap], mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
229 punpcklbw_r2r(mm7, mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
230 movq_m2r(s[1 * wrap], mm1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
231 punpcklbw_r2r(mm7, mm1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
232 movq_m2r(s[2 * wrap], mm2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
233 punpcklbw_r2r(mm7, mm2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
234 movq_m2r(s[3 * wrap], mm3);
986e461dc072 Initial revision
glantau
parents:
diff changeset
235 punpcklbw_r2r(mm7, mm3);
986e461dc072 Initial revision
glantau
parents:
diff changeset
236
986e461dc072 Initial revision
glantau
parents:
diff changeset
237 pmullw_m2r(coefs[0], mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
238 pmullw_m2r(coefs[1], mm1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
239 pmullw_m2r(coefs[2], mm2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
240 pmullw_m2r(coefs[3], mm3);
986e461dc072 Initial revision
glantau
parents:
diff changeset
241
986e461dc072 Initial revision
glantau
parents:
diff changeset
242 paddw_r2r(mm1, mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
243 paddw_r2r(mm3, mm2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
244 paddw_r2r(mm2, mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
245 psraw_i2r(FILTER_BITS, mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
246
986e461dc072 Initial revision
glantau
parents:
diff changeset
247 packuswb_r2r(mm7, mm0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
248 movq_r2m(mm0, tmp);
986e461dc072 Initial revision
glantau
parents:
diff changeset
249
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
250 *(uint32_t *)dst = tmp.ud[0];
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
251 dst += 4;
986e461dc072 Initial revision
glantau
parents:
diff changeset
252 s += 4;
986e461dc072 Initial revision
glantau
parents:
diff changeset
253 dst_width -= 4;
986e461dc072 Initial revision
glantau
parents:
diff changeset
254 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
255 while (dst_width > 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
256 sum = s[0 * wrap] * filter[0] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
257 s[1 * wrap] * filter[1] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
258 s[2 * wrap] * filter[2] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
259 s[3 * wrap] * filter[3];
986e461dc072 Initial revision
glantau
parents:
diff changeset
260 sum = sum >> FILTER_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
261 if (sum < 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
262 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
263 else if (sum > 255)
986e461dc072 Initial revision
glantau
parents:
diff changeset
264 sum = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
265 dst[0] = sum;
986e461dc072 Initial revision
glantau
parents:
diff changeset
266 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
267 s++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
268 dst_width--;
986e461dc072 Initial revision
glantau
parents:
diff changeset
269 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
270 emms();
986e461dc072 Initial revision
glantau
parents:
diff changeset
271 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
272 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
273
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
274 #ifdef HAVE_ALTIVEC
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
275 typedef union {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
276 vector unsigned char v;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
277 unsigned char c[16];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
278 } vec_uc_t;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
279
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
280 typedef union {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
281 vector signed short v;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
282 signed short s[8];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
283 } vec_ss_t;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
284
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
285 void v_resample16_altivec(uint8_t *dst, int dst_width, const uint8_t *src,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
286 int wrap, int16_t *filter)
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
287 {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
288 int sum, i;
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
289 const uint8_t *s;
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
290 vector unsigned char *tv, tmp, dstv, zero;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
291 vec_ss_t srchv[4], srclv[4], fv[4];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
292 vector signed short zeros, sumhv, sumlv;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
293 s = src;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
294
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
295 for(i=0;i<4;i++)
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
296 {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
297 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
298 The vec_madds later on does an implicit >>15 on the result.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
299 Since FILTER_BITS is 8, and we have 15 bits of magnitude in
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
300 a signed short, we have just enough bits to pre-shift our
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
301 filter constants <<7 to compensate for vec_madds.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
302 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
303 fv[i].s[0] = filter[i] << (15-FILTER_BITS);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
304 fv[i].v = vec_splat(fv[i].v, 0);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
305 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
306
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
307 zero = vec_splat_u8(0);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
308 zeros = vec_splat_s16(0);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
309
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
310
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
311 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
312 When we're resampling, we'd ideally like both our input buffers,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
313 and output buffers to be 16-byte aligned, so we can do both aligned
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
314 reads and writes. Sadly we can't always have this at the moment, so
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
315 we opt for aligned writes, as unaligned writes have a huge overhead.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
316 To do this, do enough scalar resamples to get dst 16-byte aligned.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
317 */
898
6d5e3fe7aea1 Simplify an expression and eliminate a compile warning
philipjsg
parents: 894
diff changeset
318 i = (-(int)dst) & 0xf;
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
319 while(i>0) {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
320 sum = s[0 * wrap] * filter[0] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
321 s[1 * wrap] * filter[1] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
322 s[2 * wrap] * filter[2] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
323 s[3 * wrap] * filter[3];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
324 sum = sum >> FILTER_BITS;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
325 if (sum<0) sum = 0; else if (sum>255) sum=255;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
326 dst[0] = sum;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
327 dst++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
328 s++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
329 dst_width--;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
330 i--;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
331 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
332
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
333 /* Do our altivec resampling on 16 pixels at once. */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
334 while(dst_width>=16) {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
335 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
336 Read 16 (potentially unaligned) bytes from each of
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
337 4 lines into 4 vectors, and split them into shorts.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
338 Interleave the multiply/accumulate for the resample
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
339 filter with the loads to hide the 3 cycle latency
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
340 the vec_madds have.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
341 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
342 tv = (vector unsigned char *) &s[0 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
343 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[i * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
344 srchv[0].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
345 srclv[0].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
346 sumhv = vec_madds(srchv[0].v, fv[0].v, zeros);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
347 sumlv = vec_madds(srclv[0].v, fv[0].v, zeros);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
348
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
349 tv = (vector unsigned char *) &s[1 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
350 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[1 * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
351 srchv[1].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
352 srclv[1].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
353 sumhv = vec_madds(srchv[1].v, fv[1].v, sumhv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
354 sumlv = vec_madds(srclv[1].v, fv[1].v, sumlv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
355
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
356 tv = (vector unsigned char *) &s[2 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
357 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[2 * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
358 srchv[2].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
359 srclv[2].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
360 sumhv = vec_madds(srchv[2].v, fv[2].v, sumhv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
361 sumlv = vec_madds(srclv[2].v, fv[2].v, sumlv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
362
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
363 tv = (vector unsigned char *) &s[3 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
364 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[3 * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
365 srchv[3].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
366 srclv[3].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
367 sumhv = vec_madds(srchv[3].v, fv[3].v, sumhv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
368 sumlv = vec_madds(srclv[3].v, fv[3].v, sumlv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
369
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
370 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
371 Pack the results into our destination vector,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
372 and do an aligned write of that back to memory.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
373 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
374 dstv = vec_packsu(sumhv, sumlv) ;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
375 vec_st(dstv, 0, (vector unsigned char *) dst);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
376
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
377 dst+=16;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
378 s+=16;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
379 dst_width-=16;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
380 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
381
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
382 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
383 If there are any leftover pixels, resample them
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
384 with the slow scalar method.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
385 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
386 while(dst_width>0) {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
387 sum = s[0 * wrap] * filter[0] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
388 s[1 * wrap] * filter[1] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
389 s[2 * wrap] * filter[2] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
390 s[3 * wrap] * filter[3];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
391 sum = sum >> FILTER_BITS;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
392 if (sum<0) sum = 0; else if (sum>255) sum=255;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
393 dst[0] = sum;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
394 dst++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
395 s++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
396 dst_width--;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
397 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
398 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
399 #endif
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
400
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
401 /* slow version to handle limit cases. Does not need optimisation */
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
402 static void h_resample_slow(uint8_t *dst, int dst_width,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
403 const uint8_t *src, int src_width,
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
404 int src_start, int src_incr, int16_t *filters)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
405 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
406 int src_pos, phase, sum, j, v, i;
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
407 const uint8_t *s, *src_end;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
408 int16_t *filter;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
409
986e461dc072 Initial revision
glantau
parents:
diff changeset
410 src_end = src + src_width;
986e461dc072 Initial revision
glantau
parents:
diff changeset
411 src_pos = src_start;
986e461dc072 Initial revision
glantau
parents:
diff changeset
412 for(i=0;i<dst_width;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
413 s = src + (src_pos >> POS_FRAC_BITS);
986e461dc072 Initial revision
glantau
parents:
diff changeset
414 phase = get_phase(src_pos);
986e461dc072 Initial revision
glantau
parents:
diff changeset
415 filter = filters + phase * NB_TAPS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
416 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
417 for(j=0;j<NB_TAPS;j++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
418 if (s < src)
986e461dc072 Initial revision
glantau
parents:
diff changeset
419 v = src[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
420 else if (s >= src_end)
986e461dc072 Initial revision
glantau
parents:
diff changeset
421 v = src_end[-1];
986e461dc072 Initial revision
glantau
parents:
diff changeset
422 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
423 v = s[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
424 sum += v * filter[j];
986e461dc072 Initial revision
glantau
parents:
diff changeset
425 s++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
426 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
427 sum = sum >> FILTER_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
428 if (sum < 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
429 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
430 else if (sum > 255)
986e461dc072 Initial revision
glantau
parents:
diff changeset
431 sum = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
432 dst[0] = sum;
986e461dc072 Initial revision
glantau
parents:
diff changeset
433 src_pos += src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
434 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
435 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
436 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
437
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
438 static void h_resample(uint8_t *dst, int dst_width, const uint8_t *src,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
439 int src_width, int src_start, int src_incr,
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
440 int16_t *filters)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
441 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
442 int n, src_end;
986e461dc072 Initial revision
glantau
parents:
diff changeset
443
986e461dc072 Initial revision
glantau
parents:
diff changeset
444 if (src_start < 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
445 n = (0 - src_start + src_incr - 1) / src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
446 h_resample_slow(dst, n, src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
447 dst += n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
448 dst_width -= n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
449 src_start += n * src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
450 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
451 src_end = src_start + dst_width * src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
452 if (src_end > ((src_width - NB_TAPS) << POS_FRAC_BITS)) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
453 n = (((src_width - NB_TAPS + 1) << POS_FRAC_BITS) - 1 - src_start) /
986e461dc072 Initial revision
glantau
parents:
diff changeset
454 src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
455 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
456 n = dst_width;
986e461dc072 Initial revision
glantau
parents:
diff changeset
457 }
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
458 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
459 if ((mm_flags & MM_MMX) && NB_TAPS == 4)
986e461dc072 Initial revision
glantau
parents:
diff changeset
460 h_resample_fast4_mmx(dst, n,
986e461dc072 Initial revision
glantau
parents:
diff changeset
461 src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
462 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
463 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
464 h_resample_fast(dst, n,
986e461dc072 Initial revision
glantau
parents:
diff changeset
465 src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
466 if (n < dst_width) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
467 dst += n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
468 dst_width -= n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
469 src_start += n * src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
470 h_resample_slow(dst, dst_width,
986e461dc072 Initial revision
glantau
parents:
diff changeset
471 src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
472 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
473 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
474
986e461dc072 Initial revision
glantau
parents:
diff changeset
475 static void component_resample(ImgReSampleContext *s,
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
476 uint8_t *output, int owrap, int owidth, int oheight,
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
477 uint8_t *input, int iwrap, int iwidth, int iheight)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
478 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
479 int src_y, src_y1, last_src_y, ring_y, phase_y, y1, y;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
480 uint8_t *new_line, *src_line;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
481
986e461dc072 Initial revision
glantau
parents:
diff changeset
482 last_src_y = - FCENTER - 1;
986e461dc072 Initial revision
glantau
parents:
diff changeset
483 /* position of the bottom of the filter in the source image */
986e461dc072 Initial revision
glantau
parents:
diff changeset
484 src_y = (last_src_y + NB_TAPS) * POS_FRAC;
986e461dc072 Initial revision
glantau
parents:
diff changeset
485 ring_y = NB_TAPS; /* position in ring buffer */
986e461dc072 Initial revision
glantau
parents:
diff changeset
486 for(y=0;y<oheight;y++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
487 /* apply horizontal filter on new lines from input if needed */
986e461dc072 Initial revision
glantau
parents:
diff changeset
488 src_y1 = src_y >> POS_FRAC_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
489 while (last_src_y < src_y1) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
490 if (++ring_y >= LINE_BUF_HEIGHT + NB_TAPS)
986e461dc072 Initial revision
glantau
parents:
diff changeset
491 ring_y = NB_TAPS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
492 last_src_y++;
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
493 /* handle limit conditions : replicate line (slightly
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
494 inefficient because we filter multiple times) */
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
495 y1 = last_src_y;
986e461dc072 Initial revision
glantau
parents:
diff changeset
496 if (y1 < 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
497 y1 = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
498 } else if (y1 >= iheight) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
499 y1 = iheight - 1;
986e461dc072 Initial revision
glantau
parents:
diff changeset
500 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
501 src_line = input + y1 * iwrap;
986e461dc072 Initial revision
glantau
parents:
diff changeset
502 new_line = s->line_buf + ring_y * owidth;
986e461dc072 Initial revision
glantau
parents:
diff changeset
503 /* apply filter and handle limit cases correctly */
986e461dc072 Initial revision
glantau
parents:
diff changeset
504 h_resample(new_line, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
505 src_line, iwidth, - FCENTER * POS_FRAC, s->h_incr,
986e461dc072 Initial revision
glantau
parents:
diff changeset
506 &s->h_filters[0][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
507 /* handle ring buffer wraping */
986e461dc072 Initial revision
glantau
parents:
diff changeset
508 if (ring_y >= LINE_BUF_HEIGHT) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
509 memcpy(s->line_buf + (ring_y - LINE_BUF_HEIGHT) * owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
510 new_line, owidth);
986e461dc072 Initial revision
glantau
parents:
diff changeset
511 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
512 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
513 /* apply vertical filter */
986e461dc072 Initial revision
glantau
parents:
diff changeset
514 phase_y = get_phase(src_y);
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
515 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
516 /* desactivated MMX because loss of precision */
986e461dc072 Initial revision
glantau
parents:
diff changeset
517 if ((mm_flags & MM_MMX) && NB_TAPS == 4 && 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
518 v_resample4_mmx(output, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
519 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
520 &s->v_filters[phase_y][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
521 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
522 #endif
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
523 #ifdef HAVE_ALTIVEC
920
a0ad8e3452f2 practically disabling altivec resampling code (some ppl said its broken) patch by (Dieter Shirley <dieters at schemasoft dot com>)
michaelni
parents: 898
diff changeset
524 if ((mm_flags & MM_ALTIVEC) && NB_TAPS == 4 && FILTER_BITS <= 6)
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
525 v_resample16_altivec(output, owidth,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
526 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
527 &s->v_filters[phase_y][0]);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
528 else
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
529 #endif
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
530 v_resample(output, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
531 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
532 &s->v_filters[phase_y][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
533
986e461dc072 Initial revision
glantau
parents:
diff changeset
534 src_y += s->v_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
535 output += owrap;
986e461dc072 Initial revision
glantau
parents:
diff changeset
536 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
537 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
538
986e461dc072 Initial revision
glantau
parents:
diff changeset
539 /* XXX: the following filter is quite naive, but it seems to suffice
986e461dc072 Initial revision
glantau
parents:
diff changeset
540 for 4 taps */
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
541 static void build_filter(int16_t *filter, float factor)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
542 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
543 int ph, i, v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
544 float x, y, tab[NB_TAPS], norm, mult;
986e461dc072 Initial revision
glantau
parents:
diff changeset
545
986e461dc072 Initial revision
glantau
parents:
diff changeset
546 /* if upsampling, only need to interpolate, no filter */
986e461dc072 Initial revision
glantau
parents:
diff changeset
547 if (factor > 1.0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
548 factor = 1.0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
549
986e461dc072 Initial revision
glantau
parents:
diff changeset
550 for(ph=0;ph<NB_PHASES;ph++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
551 norm = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
552 for(i=0;i<NB_TAPS;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
553
986e461dc072 Initial revision
glantau
parents:
diff changeset
554 x = M_PI * ((float)(i - FCENTER) - (float)ph / NB_PHASES) * factor;
986e461dc072 Initial revision
glantau
parents:
diff changeset
555 if (x == 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
556 y = 1.0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
557 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
558 y = sin(x) / x;
986e461dc072 Initial revision
glantau
parents:
diff changeset
559 tab[i] = y;
986e461dc072 Initial revision
glantau
parents:
diff changeset
560 norm += y;
986e461dc072 Initial revision
glantau
parents:
diff changeset
561 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
562
986e461dc072 Initial revision
glantau
parents:
diff changeset
563 /* normalize so that an uniform color remains the same */
986e461dc072 Initial revision
glantau
parents:
diff changeset
564 mult = (float)(1 << FILTER_BITS) / norm;
986e461dc072 Initial revision
glantau
parents:
diff changeset
565 for(i=0;i<NB_TAPS;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
566 v = (int)(tab[i] * mult);
986e461dc072 Initial revision
glantau
parents:
diff changeset
567 filter[ph * NB_TAPS + i] = v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
568 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
569 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
570 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
571
986e461dc072 Initial revision
glantau
parents:
diff changeset
572 ImgReSampleContext *img_resample_init(int owidth, int oheight,
986e461dc072 Initial revision
glantau
parents:
diff changeset
573 int iwidth, int iheight)
986e461dc072 Initial revision
glantau
parents:
diff changeset
574 {
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
575 return img_resample_full_init(owidth, oheight, iwidth, iheight, 0, 0, 0, 0);
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
576 }
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
577
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
578 ImgReSampleContext *img_resample_full_init(int owidth, int oheight,
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
579 int iwidth, int iheight,
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
580 int topBand, int bottomBand,
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
581 int leftBand, int rightBand)
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
582 {
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
583 ImgReSampleContext *s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
584
986e461dc072 Initial revision
glantau
parents:
diff changeset
585 s = av_mallocz(sizeof(ImgReSampleContext));
986e461dc072 Initial revision
glantau
parents:
diff changeset
586 if (!s)
986e461dc072 Initial revision
glantau
parents:
diff changeset
587 return NULL;
986e461dc072 Initial revision
glantau
parents:
diff changeset
588 s->line_buf = av_mallocz(owidth * (LINE_BUF_HEIGHT + NB_TAPS));
986e461dc072 Initial revision
glantau
parents:
diff changeset
589 if (!s->line_buf)
986e461dc072 Initial revision
glantau
parents:
diff changeset
590 goto fail;
986e461dc072 Initial revision
glantau
parents:
diff changeset
591
986e461dc072 Initial revision
glantau
parents:
diff changeset
592 s->owidth = owidth;
986e461dc072 Initial revision
glantau
parents:
diff changeset
593 s->oheight = oheight;
986e461dc072 Initial revision
glantau
parents:
diff changeset
594 s->iwidth = iwidth;
986e461dc072 Initial revision
glantau
parents:
diff changeset
595 s->iheight = iheight;
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
596 s->topBand = topBand;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
597 s->bottomBand = bottomBand;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
598 s->leftBand = leftBand;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
599 s->rightBand = rightBand;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
600
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
601 s->h_incr = ((iwidth - leftBand - rightBand) * POS_FRAC) / owidth;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
602 s->v_incr = ((iheight - topBand - bottomBand) * POS_FRAC) / oheight;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
603
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
604 build_filter(&s->h_filters[0][0], (float) owidth / (float) (iwidth - leftBand - rightBand));
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
605 build_filter(&s->v_filters[0][0], (float) oheight / (float) (iheight - topBand - bottomBand));
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
606
986e461dc072 Initial revision
glantau
parents:
diff changeset
607 return s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
608 fail:
396
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
609 av_free(s);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
610 return NULL;
986e461dc072 Initial revision
glantau
parents:
diff changeset
611 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
612
986e461dc072 Initial revision
glantau
parents:
diff changeset
613 void img_resample(ImgReSampleContext *s,
1488
766a2f4edbea avcodec const correctness patch by (Drew Hess <dhess at ilm dot com>)
michaelni
parents: 1106
diff changeset
614 AVPicture *output, const AVPicture *input)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
615 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
616 int i, shift;
986e461dc072 Initial revision
glantau
parents:
diff changeset
617
986e461dc072 Initial revision
glantau
parents:
diff changeset
618 for(i=0;i<3;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
619 shift = (i == 0) ? 0 : 1;
986e461dc072 Initial revision
glantau
parents:
diff changeset
620 component_resample(s, output->data[i], output->linesize[i],
986e461dc072 Initial revision
glantau
parents:
diff changeset
621 s->owidth >> shift, s->oheight >> shift,
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
622 input->data[i] + (input->linesize[i] * (s->topBand >> shift)) + (s->leftBand >> shift),
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
623 input->linesize[i], ((s->iwidth - s->leftBand - s->rightBand) >> shift),
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
624 (s->iheight - s->topBand - s->bottomBand) >> shift);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
625 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
626 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
627
986e461dc072 Initial revision
glantau
parents:
diff changeset
628 void img_resample_close(ImgReSampleContext *s)
986e461dc072 Initial revision
glantau
parents:
diff changeset
629 {
396
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
630 av_free(s->line_buf);
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
631 av_free(s);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
632 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
633
986e461dc072 Initial revision
glantau
parents:
diff changeset
634 #ifdef TEST
986e461dc072 Initial revision
glantau
parents:
diff changeset
635
986e461dc072 Initial revision
glantau
parents:
diff changeset
/*
 * Stand-alone replacement used by the TEST build: return 'size' bytes of
 * zero-filled memory, or NULL if 'size' is negative or the allocation
 * fails.  The result is released with av_free().
 */
void *av_mallocz(int size)
{
    /* a negative int would turn into an enormous size_t request */
    if (size < 0)
        return NULL;
    /* calloc zero-fills and reports failure as NULL, so no memset is
       performed on an unchecked pointer */
    return calloc(1, (size_t)size);
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
643
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
/*
 * Stand-alone replacement used by the TEST build: release memory obtained
 * from av_mallocz().  NULL is accepted; the C standard defines free(NULL)
 * as a no-op, so no explicit test is needed.
 */
void av_free(void *ptr)
{
    free(ptr);
}
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
650
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
/* input: one 8-bit plane of XSIZE x YSIZE samples, filled in by main() */
#define XSIZE 256
#define YSIZE 256
uint8_t img[XSIZE * YSIZE];

/* output: two planes of up to XSIZE1 x YSIZE1 samples; main() resamples
   into img1, and into img2 for the second run of the MMX comparison */
#define XSIZE1 512
#define YSIZE1 512
uint8_t img1[XSIZE1 * YSIZE1];
uint8_t img2[XSIZE1 * YSIZE1];
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
661
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
/*
 * Write an 8-bit grey image as a binary PGM ("P5") file.
 *
 * filename  path of the file to create or overwrite
 * img       xsize * ysize samples, stored row after row
 * xsize     image width written to the header
 * ysize     image height written to the header
 *
 * Problems (negative size, file cannot be opened, short write, close
 * failure) are reported on stderr; the function returns nothing.
 */
void save_pgm(const char *filename, uint8_t *img, int xsize, int ysize)
{
    FILE *f;
    size_t count;

    if (xsize < 0 || ysize < 0) {
        fprintf(stderr, "%s: invalid image size %dx%d\n",
                filename, xsize, ysize);
        return;
    }
    count = (size_t)xsize * (size_t)ysize;

    /* "wb": the sample data is binary and must not be newline-translated */
    f = fopen(filename, "wb");
    if (!f) {
        perror(filename);
        return;
    }
    fprintf(f, "P5\n%d %d\n%d\n", xsize, ysize, 255);
    if (fwrite(img, 1, count, f) != count)
        fprintf(stderr, "%s: short write\n", filename);
    /* fclose flushes buffered data, so a failure here means data loss */
    if (fclose(f) != 0)
        perror(filename);
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
670
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
671 static void dump_filter(int16_t *filter)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
672 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
673 int i, ph;
986e461dc072 Initial revision
glantau
parents:
diff changeset
674
986e461dc072 Initial revision
glantau
parents:
diff changeset
675 for(ph=0;ph<NB_PHASES;ph++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
676 printf("%2d: ", ph);
986e461dc072 Initial revision
glantau
parents:
diff changeset
677 for(i=0;i<NB_TAPS;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
678 printf(" %5.2f", filter[ph * NB_TAPS + i] / 256.0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
679 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
680 printf("\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
681 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
682 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
683
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
684 #ifdef HAVE_MMX
644
641708b5c33c fixing tests
michaelni
parents: 630
diff changeset
685 int mm_flags;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
686 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
687
986e461dc072 Initial revision
glantau
parents:
diff changeset
688 int main(int argc, char **argv)
986e461dc072 Initial revision
glantau
parents:
diff changeset
689 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
690 int x, y, v, i, xsize, ysize;
986e461dc072 Initial revision
glantau
parents:
diff changeset
691 ImgReSampleContext *s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
692 float fact, factors[] = { 1/2.0, 3.0/4.0, 1.0, 4.0/3.0, 16.0/9.0, 2.0 };
986e461dc072 Initial revision
glantau
parents:
diff changeset
693 char buf[256];
986e461dc072 Initial revision
glantau
parents:
diff changeset
694
986e461dc072 Initial revision
glantau
parents:
diff changeset
695 /* build test image */
986e461dc072 Initial revision
glantau
parents:
diff changeset
696 for(y=0;y<YSIZE;y++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
697 for(x=0;x<XSIZE;x++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
698 if (x < XSIZE/2 && y < YSIZE/2) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
699 if (x < XSIZE/4 && y < YSIZE/4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
700 if ((x % 10) <= 6 &&
986e461dc072 Initial revision
glantau
parents:
diff changeset
701 (y % 10) <= 6)
986e461dc072 Initial revision
glantau
parents:
diff changeset
702 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
703 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
704 v = 0x00;
986e461dc072 Initial revision
glantau
parents:
diff changeset
705 } else if (x < XSIZE/4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
706 if (x & 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
707 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
708 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
709 v = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
710 } else if (y < XSIZE/4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
711 if (y & 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
712 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
713 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
714 v = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
715 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
716 if (y < YSIZE*3/8) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
717 if ((y+x) & 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
718 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
719 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
720 v = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
721 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
722 if (((x+3) % 4) <= 1 &&
986e461dc072 Initial revision
glantau
parents:
diff changeset
723 ((y+3) % 4) <= 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
724 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
725 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
726 v = 0x00;
986e461dc072 Initial revision
glantau
parents:
diff changeset
727 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
728 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
729 } else if (x < XSIZE/2) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
730 v = ((x - (XSIZE/2)) * 255) / (XSIZE/2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
731 } else if (y < XSIZE/2) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
732 v = ((y - (XSIZE/2)) * 255) / (XSIZE/2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
733 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
734 v = ((x + y - XSIZE) * 255) / XSIZE;
986e461dc072 Initial revision
glantau
parents:
diff changeset
735 }
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
736 img[(YSIZE - y) * XSIZE + (XSIZE - x)] = v;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
737 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
738 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
739 save_pgm("/tmp/in.pgm", img, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
740 for(i=0;i<sizeof(factors)/sizeof(float);i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
741 fact = factors[i];
986e461dc072 Initial revision
glantau
parents:
diff changeset
742 xsize = (int)(XSIZE * fact);
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
743 ysize = (int)((YSIZE - 100) * fact);
644
641708b5c33c fixing tests
michaelni
parents: 630
diff changeset
744 s = img_resample_full_init(xsize, ysize, XSIZE, YSIZE, 50 ,50, 0, 0);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
745 printf("Factor=%0.2f\n", fact);
986e461dc072 Initial revision
glantau
parents:
diff changeset
746 dump_filter(&s->h_filters[0][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
747 component_resample(s, img1, xsize, xsize, ysize,
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
748 img + 50 * XSIZE, XSIZE, XSIZE, YSIZE - 100);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
749 img_resample_close(s);
986e461dc072 Initial revision
glantau
parents:
diff changeset
750
986e461dc072 Initial revision
glantau
parents:
diff changeset
751 sprintf(buf, "/tmp/out%d.pgm", i);
986e461dc072 Initial revision
glantau
parents:
diff changeset
752 save_pgm(buf, img1, xsize, ysize);
986e461dc072 Initial revision
glantau
parents:
diff changeset
753 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
754
986e461dc072 Initial revision
glantau
parents:
diff changeset
755 /* mmx test */
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
756 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
757 printf("MMX test\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
758 fact = 0.72;
986e461dc072 Initial revision
glantau
parents:
diff changeset
759 xsize = (int)(XSIZE * fact);
986e461dc072 Initial revision
glantau
parents:
diff changeset
760 ysize = (int)(YSIZE * fact);
986e461dc072 Initial revision
glantau
parents:
diff changeset
761 mm_flags = MM_MMX;
986e461dc072 Initial revision
glantau
parents:
diff changeset
762 s = img_resample_init(xsize, ysize, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
763 component_resample(s, img1, xsize, xsize, ysize,
986e461dc072 Initial revision
glantau
parents:
diff changeset
764 img, XSIZE, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
765
986e461dc072 Initial revision
glantau
parents:
diff changeset
766 mm_flags = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
767 s = img_resample_init(xsize, ysize, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
768 component_resample(s, img2, xsize, xsize, ysize,
986e461dc072 Initial revision
glantau
parents:
diff changeset
769 img, XSIZE, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
770 if (memcmp(img1, img2, xsize * ysize) != 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
771 fprintf(stderr, "mmx error\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
772 exit(1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
773 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
774 printf("MMX OK\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
775 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
776 return 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
777 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
778
986e461dc072 Initial revision
glantau
parents:
diff changeset
779 #endif