Mercurial > libavcodec.hg
annotate dv.c @ 8168:0dcd9d4dd87f libavcodec
SH4: replace missed rnd_avg2 -> rnd_avg32
| author | mru |
|---|---|
| date | Wed, 19 Nov 2008 00:37:17 +0000 |
| parents | ab31736c0f23 |
| children | 471b16105266 |
| rev | line source |
|---|---|
| 723 | 1 /* |
| 2 * DV decoder | |
| 3 * Copyright (c) 2002 Fabrice Bellard. | |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
4 * Copyright (c) 2004 Roman Shaposhnik. |
| 723 | 5 * |
| 2967 | 6 * DV encoder |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
7 * Copyright (c) 2003 Roman Shaposhnik. |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
8 * |
| 3167 | 9 * 50 Mbps (DVCPRO50) support |
| 10 * Copyright (c) 2006 Daniel Maas <dmaas@maasdigital.com> | |
| 11 * | |
|
7715
e8f71784062e
Initial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
12 * 100 Mbps (DVCPRO HD) support |
|
e8f71784062e
Initial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
13 * Initial code by Daniel Maas <dmaas@maasdigital.com> (funded by BBC R&D) |
|
e8f71784062e
Initial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
14 * Final code by Roman Shaposhnik |
|
e8f71784062e
Initial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
15 * |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
16 * Many thanks to Dan Dennedy <dan@dennedy.org> for providing wealth |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
17 * of DV technical info. |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
18 * |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
19 * This file is part of FFmpeg. |
|
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
20 * |
|
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
21 * FFmpeg is free software; you can redistribute it and/or |
| 723 | 22 * modify it under the terms of the GNU Lesser General Public |
| 23 * License as published by the Free Software Foundation; either | |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
24 * version 2.1 of the License, or (at your option) any later version. |
| 723 | 25 * |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
26 * FFmpeg is distributed in the hope that it will be useful, |
| 723 | 27 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 28 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
| 29 * Lesser General Public License for more details. | |
| 30 * | |
| 31 * You should have received a copy of the GNU Lesser General Public | |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
32 * License along with FFmpeg; if not, write to the Free Software |
|
3036
0b546eab515d
Update licensing information: The FSF changed postal address.
diego
parents:
3016
diff
changeset
|
33 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| 723 | 34 */ |
| 1106 | 35 |
| 36 /** | |
| 37 * @file dv.c | |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
38 * DV codec. |
| 1106 | 39 */ |
| 3649 | 40 #define ALT_BITSTREAM_READER |
| 723 | 41 #include "avcodec.h" |
| 42 #include "dsputil.h" | |
| 6450 | 43 #include "bitstream.h" |
| 723 | 44 #include "simple_idct.h" |
|
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
45 #include "dvdata.h" |
| 723 | 46 |
| 2847 | 47 //#undef NDEBUG |
| 48 //#include <assert.h> | |
| 49 | |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
50 typedef struct DVVideoContext { |
| 8051 | 51 const DVprofile *sys; |
| 52 AVFrame picture; | |
| 53 AVCodecContext *avctx; | |
| 54 uint8_t *buf; | |
| 2967 | 55 |
| 8051 | 56 uint8_t dv_zigzag[2][64]; |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
57 uint32_t dv_idct_factor[2][2][22][64]; |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
58 uint32_t dv100_idct_factor[4][4][16][64]; |
| 2967 | 59 |
|
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
60 void (*get_pixels)(DCTELEM *block, const uint8_t *pixels, int line_size); |
| 1567 | 61 void (*fdct[2])(DCTELEM *block); |
| 62 void (*idct_put[2])(uint8_t *dest, int line_size, DCTELEM *block); | |
|
3016
97e6c0f82182
Moving dv_anchor back to the global scope. This creates a tiny memory
romansh
parents:
2991
diff
changeset
|
63 } DVVideoContext; |
|
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
64 |
|
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
65 #define TEX_VLC_BITS 9 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
66 |
|
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
67 #if ENABLE_SMALL |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
68 #define DV_VLC_MAP_RUN_SIZE 15 |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
69 #define DV_VLC_MAP_LEV_SIZE 23 |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
70 #else |
| 2967 | 71 #define DV_VLC_MAP_RUN_SIZE 64 |
| 2847 | 72 #define DV_VLC_MAP_LEV_SIZE 512 //FIXME sign was removed so this should be /2 but needs check |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
73 #endif |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
74 |
| 723 | 75 /* XXX: also include quantization */ |
| 4661 | 76 static RL_VLC_ELEM dv_rl_vlc[1184]; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
77 /* VLC encoding lookup table */ |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
78 static struct dv_vlc_pair { |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
79 uint32_t vlc; |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
80 uint8_t size; |
| 4666 | 81 } dv_vlc_map[DV_VLC_MAP_RUN_SIZE][DV_VLC_MAP_LEV_SIZE]; |
| 723 | 82 |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
83 static inline int dv_work_pool_size(const DVprofile *d) |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
84 { |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
85 int size = d->n_difchan*d->difseg_size*27; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
86 if (DV_PROFILE_IS_1080i50(d)) |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
87 size -= 3*27; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
88 if (DV_PROFILE_IS_720p50(d)) |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
89 size -= 4*27; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
90 return size; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
91 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
92 |
| 8164 | 93 static inline void dv_calc_mb_coordinates(const DVprofile *d, int chan, int seq, int slot, |
| 94 uint16_t *tbl) | |
| 95 { | |
| 96 const static uint8_t off[] = { 2, 6, 8, 0, 4 }; | |
| 97 const static uint8_t shuf1[] = { 36, 18, 54, 0, 72 }; | |
| 98 const static uint8_t shuf2[] = { 24, 12, 36, 0, 48 }; | |
| 99 const static uint8_t shuf3[] = { 18, 9, 27, 0, 36 }; | |
| 100 | |
| 101 const static uint8_t l_start[] = {0, 4, 9, 13, 18, 22, 27, 31, 36, 40}; | |
| 102 const static uint8_t l_start_shuffled[] = { 9, 4, 13, 0, 18 }; | |
| 103 | |
| 104 const static uint8_t serpent1[] = {0, 1, 2, 2, 1, 0, | |
| 105 0, 1, 2, 2, 1, 0, | |
| 106 0, 1, 2, 2, 1, 0, | |
| 107 0, 1, 2, 2, 1, 0, | |
| 108 0, 1, 2}; | |
| 109 const static uint8_t serpent2[] = {0, 1, 2, 3, 4, 5, 5, 4, 3, 2, 1, 0, | |
| 110 0, 1, 2, 3, 4, 5, 5, 4, 3, 2, 1, 0, | |
| 111 0, 1, 2, 3, 4, 5}; | |
| 112 | |
| 113 const static uint8_t remap[][2] = {{ 0, 0}, { 0, 0}, { 0, 0}, { 0, 0}, /* dummy */ | |
| 114 { 0, 0}, { 0, 1}, { 0, 2}, { 0, 3}, {10, 0}, | |
| 115 {10, 1}, {10, 2}, {10, 3}, {20, 0}, {20, 1}, | |
| 116 {20, 2}, {20, 3}, {30, 0}, {30, 1}, {30, 2}, | |
| 117 {30, 3}, {40, 0}, {40, 1}, {40, 2}, {40, 3}, | |
| 118 {50, 0}, {50, 1}, {50, 2}, {50, 3}, {60, 0}, | |
| 119 {60, 1}, {60, 2}, {60, 3}, {70, 0}, {70, 1}, | |
| 120 {70, 2}, {70, 3}, { 0,64}, { 0,65}, { 0,66}, | |
| 121 {10,64}, {10,65}, {10,66}, {20,64}, {20,65}, | |
| 122 {20,66}, {30,64}, {30,65}, {30,66}, {40,64}, | |
| 123 {40,65}, {40,66}, {50,64}, {50,65}, {50,66}, | |
| 124 {60,64}, {60,65}, {60,66}, {70,64}, {70,65}, | |
| 125 {70,66}, { 0,67}, {20,67}, {40,67}, {60,67}}; | |
| 126 | |
| 127 int i, k, m; | |
| 128 int x, y, blk; | |
| 129 | |
| 130 for (m=0; m<5; m++) { | |
| 131 switch (d->width) { | |
| 132 case 1440: | |
| 133 blk = (chan*11+seq)*27+slot; | |
| 134 | |
| 135 if (chan == 0 && seq == 11) { | |
| 136 x = m*27+slot; | |
| 137 if (x<90) { | |
| 138 y = 0; | |
| 139 } else { | |
| 140 x = (x - 90)*2; | |
| 141 y = 67; | |
| 142 } | |
| 143 } else { | |
| 144 i = (4*chan + blk + off[m])%11; | |
| 145 k = (blk/11)%27; | |
| 146 | |
| 147 x = shuf1[m] + (chan&1)*9 + k%9; | |
| 148 y = (i*3+k/9)*2 + (chan>>1) + 1; | |
| 149 } | |
| 150 tbl[m] = (x<<1)|(y<<9); | |
| 151 break; | |
| 152 case 1280: | |
| 153 blk = (chan*10+seq)*27+slot; | |
| 154 | |
| 155 i = (4*chan + (seq/5) + 2*blk + off[m])%10; | |
| 156 k = (blk/5)%27; | |
| 157 | |
| 158 x = shuf1[m]+(chan&1)*9 + k%9; | |
| 159 y = (i*3+k/9)*2 + (chan>>1) + 4; | |
| 160 | |
| 161 if (x >= 80) { | |
| 162 x = remap[y][0]+((x-80)<<(y>59)); | |
| 163 y = remap[y][1]; | |
| 164 } | |
| 165 tbl[m] = (x<<1)|(y<<9); | |
| 166 break; | |
| 167 case 960: | |
| 168 blk = (chan*10+seq)*27+slot; | |
| 169 | |
| 170 i = (4*chan + (seq/5) + 2*blk + off[m])%10; | |
| 171 k = (blk/5)%27 + (i&1)*3; | |
| 172 | |
| 173 x = shuf2[m] + k%6 + 6*(chan&1); | |
| 174 y = l_start[i] + k/6 + 45*(chan>>1); | |
| 175 tbl[m] = (x<<1)|(y<<9); | |
| 176 break; | |
| 177 case 720: | |
| 178 switch (d->pix_fmt) { | |
| 179 case PIX_FMT_YUV422P: | |
| 180 x = shuf3[m] + slot/3; | |
| 181 y = serpent1[slot] + | |
| 182 ((((seq + off[m]) % d->difseg_size)<<1) + chan)*3; | |
| 183 tbl[m] = (x<<1)|(y<<8); | |
| 184 break; | |
| 185 case PIX_FMT_YUV420P: | |
| 186 x = shuf3[m] + slot/3; | |
| 187 y = serpent1[slot] + | |
| 188 ((seq + off[m]) % d->difseg_size)*3; | |
| 189 tbl[m] = (x<<1)|(y<<9); | |
| 190 break; | |
| 191 case PIX_FMT_YUV411P: | |
| 192 i = (seq + off[m]) % d->difseg_size; | |
| 193 k = slot + ((m==1||m==2)?3:0); | |
| 194 | |
| 195 x = l_start_shuffled[m] + k/6; | |
| 196 y = serpent2[k] + i*6; | |
| 197 if (x>21) | |
| 198 y = y*2 - i*6; | |
| 199 tbl[m] = (x<<2)|(y<<8); | |
| 200 break; | |
| 201 } | |
| 202 default: | |
| 203 break; | |
| 204 } | |
| 205 } | |
| 206 } | |
| 207 | |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
208 static int dv_init_dynamic_tables(const DVprofile *d) |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
209 { |
| 8164 | 210 int j,i,c,s,p; |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
211 |
| 8131 | 212 if (d->work_chunks[dv_work_pool_size(d)-1].buf_offset) |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
213 return 0; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
214 |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
215 p = i = 0; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
216 for (c=0; c<d->n_difchan; c++) { |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
217 for (s=0; s<d->difseg_size; s++) { |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
218 p += 6; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
219 for (j=0; j<27; j++) { |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
220 p += !(j%3); |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
221 if (!(DV_PROFILE_IS_1080i50(d) && c != 0 && s == 11) && |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
222 !(DV_PROFILE_IS_720p50(d) && s > 9)) { |
| 8164 | 223 dv_calc_mb_coordinates(d, c, s, j, &d->work_chunks[i].mb_coordinates[0]); |
| 8131 | 224 d->work_chunks[i++].buf_offset = p; |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
225 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
226 p += 5; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
227 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
228 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
229 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
230 return 0; |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
231 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
232 |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
233 static void dv_build_unquantize_tables(DVVideoContext *s, uint8_t* perm) |
| 723 | 234 { |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
235 int i, q, a; |
| 723 | 236 |
| 237 /* NOTE: max left shift is 6 */ | |
| 8051 | 238 for (q = 0; q < 22; q++) { |
| 1567 | 239 /* 88DCT */ |
| 8051 | 240 i = 1; |
| 241 for (a = 0; a < 4; a++) { | |
| 242 for (; i < dv_quant_areas[a]; i++) { | |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
243 /* 88 table */ |
| 8051 | 244 s->dv_idct_factor[0][0][q][i] = dv_iweight_88[i] << (dv_quant_shifts[q][a] + 1); |
| 245 s->dv_idct_factor[1][0][q][i] = s->dv_idct_factor[0][0][q][i] << 1; | |
| 2967 | 246 |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
247 /* 248 table */ |
| 8051 | 248 s->dv_idct_factor[0][1][q][i] = dv_iweight_248[i] << (dv_quant_shifts[q][a] + 1); |
| 249 s->dv_idct_factor[1][1][q][i] = s->dv_idct_factor[0][1][q][i] << 1; | |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
250 } |
| 723 | 251 } |
| 252 } | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
253 |
| 8051 | 254 for (a = 0; a < 4; a++) { |
| 255 for (q = 0; q < 16; q++) { | |
| 256 for (i = 1; i < 64; i++) { | |
| 257 s->dv100_idct_factor[0][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_1080_y[i]; | |
| 258 s->dv100_idct_factor[1][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_1080_c[i]; | |
| 259 s->dv100_idct_factor[2][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_720_y[i]; | |
| 260 s->dv100_idct_factor[3][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_720_c[i]; | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
261 } |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
262 } |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
263 } |
| 723 | 264 } |
| 265 | |
|
6517
48759bfbd073
Apply 'cold' attribute to init/uninit functions in libavcodec
zuxy
parents:
6450
diff
changeset
|
266 static av_cold int dvvideo_init(AVCodecContext *avctx) |
| 723 | 267 { |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
268 DVVideoContext *s = avctx->priv_data; |
| 1567 | 269 DSPContext dsp; |
| 8051 | 270 static int done = 0; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
271 int i, j; |
| 723 | 272 |
| 273 if (!done) { | |
|
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
274 VLC dv_vlc; |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
275 uint16_t new_dv_vlc_bits[NB_DV_VLC*2]; |
| 8051 | 276 uint8_t new_dv_vlc_len[NB_DV_VLC*2]; |
| 277 uint8_t new_dv_vlc_run[NB_DV_VLC*2]; | |
| 278 int16_t new_dv_vlc_level[NB_DV_VLC*2]; | |
| 723 | 279 |
| 280 done = 1; | |
| 281 | |
| 2979 | 282 /* it's faster to include sign bit in a generic VLC parsing scheme */ |
| 8051 | 283 for (i = 0, j = 0; i < NB_DV_VLC; i++, j++) { |
| 284 new_dv_vlc_bits[j] = dv_vlc_bits[i]; | |
| 285 new_dv_vlc_len[j] = dv_vlc_len[i]; | |
| 286 new_dv_vlc_run[j] = dv_vlc_run[i]; | |
| 2979 | 287 new_dv_vlc_level[j] = dv_vlc_level[i]; |
| 2967 | 288 |
| 2979 | 289 if (dv_vlc_level[i]) { |
| 290 new_dv_vlc_bits[j] <<= 1; | |
| 291 new_dv_vlc_len[j]++; | |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
292 |
| 2979 | 293 j++; |
| 8051 | 294 new_dv_vlc_bits[j] = (dv_vlc_bits[i] << 1) | 1; |
| 295 new_dv_vlc_len[j] = dv_vlc_len[i] + 1; | |
| 296 new_dv_vlc_run[j] = dv_vlc_run[i]; | |
| 2979 | 297 new_dv_vlc_level[j] = -dv_vlc_level[i]; |
| 298 } | |
| 299 } | |
| 2967 | 300 |
| 723 | 301 /* NOTE: as a trick, we use the fact the no codes are unused |
| 302 to accelerate the parsing of partial codes */ | |
| 2967 | 303 init_vlc(&dv_vlc, TEX_VLC_BITS, j, |
|
2370
26560d4fdb1f
Memory leak fix patch by (Burkhard Plaum <plaum >at< ipf.uni-stuttgart )dot( de>)
michael
parents:
2247
diff
changeset
|
304 new_dv_vlc_len, 1, 1, new_dv_vlc_bits, 2, 2, 0); |
| 4661 | 305 assert(dv_vlc.table_size == 1184); |
|
3016
97e6c0f82182
Moving dv_anchor back to the global scope. This creates a tiny memory
romansh
parents:
2991
diff
changeset
|
306 |
| 8051 | 307 for (i = 0; i < dv_vlc.table_size; i++){ |
| 308 int code = dv_vlc.table[i][0]; | |
| 309 int len = dv_vlc.table[i][1]; | |
| 723 | 310 int level, run; |
| 2967 | 311 |
| 8051 | 312 if (len < 0){ //more bits needed |
| 313 run = 0; | |
| 314 level = code; | |
| 723 | 315 } else { |
| 8051 | 316 run = new_dv_vlc_run [code] + 1; |
| 317 level = new_dv_vlc_level[code]; | |
| 723 | 318 } |
| 8051 | 319 dv_rl_vlc[i].len = len; |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
320 dv_rl_vlc[i].level = level; |
| 8051 | 321 dv_rl_vlc[i].run = run; |
| 723 | 322 } |
| 2979 | 323 free_vlc(&dv_vlc); |
|
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
324 |
| 2979 | 325 for (i = 0; i < NB_DV_VLC - 1; i++) { |
|
2027
3a78447c3b53
oops, forgot to commit that change from the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1994
diff
changeset
|
326 if (dv_vlc_run[i] >= DV_VLC_MAP_RUN_SIZE) |
| 2979 | 327 continue; |
|
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
328 #if ENABLE_SMALL |
|
2027
3a78447c3b53
oops, forgot to commit that change from the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1994
diff
changeset
|
329 if (dv_vlc_level[i] >= DV_VLC_MAP_LEV_SIZE) |
| 2979 | 330 continue; |
|
2027
3a78447c3b53
oops, forgot to commit that change from the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1994
diff
changeset
|
331 #endif |
| 2967 | 332 |
| 2979 | 333 if (dv_vlc_map[dv_vlc_run[i]][dv_vlc_level[i]].size != 0) |
| 334 continue; | |
| 2967 | 335 |
| 8051 | 336 dv_vlc_map[dv_vlc_run[i]][dv_vlc_level[i]].vlc = |
| 337 dv_vlc_bits[i] << (!!dv_vlc_level[i]); | |
| 338 dv_vlc_map[dv_vlc_run[i]][dv_vlc_level[i]].size = | |
| 339 dv_vlc_len[i] + (!!dv_vlc_level[i]); | |
| 2979 | 340 } |
| 341 for (i = 0; i < DV_VLC_MAP_RUN_SIZE; i++) { | |
|
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
342 #if ENABLE_SMALL |
| 2979 | 343 for (j = 1; j < DV_VLC_MAP_LEV_SIZE; j++) { |
| 344 if (dv_vlc_map[i][j].size == 0) { | |
| 345 dv_vlc_map[i][j].vlc = dv_vlc_map[0][j].vlc | | |
| 346 (dv_vlc_map[i-1][0].vlc << (dv_vlc_map[0][j].size)); | |
| 347 dv_vlc_map[i][j].size = dv_vlc_map[i-1][0].size + | |
| 348 dv_vlc_map[0][j].size; | |
| 349 } | |
| 350 } | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
351 #else |
| 2979 | 352 for (j = 1; j < DV_VLC_MAP_LEV_SIZE/2; j++) { |
| 353 if (dv_vlc_map[i][j].size == 0) { | |
| 354 dv_vlc_map[i][j].vlc = dv_vlc_map[0][j].vlc | | |
| 355 (dv_vlc_map[i-1][0].vlc << (dv_vlc_map[0][j].size)); | |
| 356 dv_vlc_map[i][j].size = dv_vlc_map[i-1][0].size + | |
| 357 dv_vlc_map[0][j].size; | |
| 358 } | |
| 359 dv_vlc_map[i][((uint16_t)(-j))&0x1ff].vlc = | |
| 360 dv_vlc_map[i][j].vlc | 1; | |
| 361 dv_vlc_map[i][((uint16_t)(-j))&0x1ff].size = | |
| 362 dv_vlc_map[i][j].size; | |
| 363 } | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
364 #endif |
| 2979 | 365 } |
| 723 | 366 } |
| 725 | 367 |
| 1567 | 368 /* Generic DSP setup */ |
| 369 dsputil_init(&dsp, avctx); | |
| 370 s->get_pixels = dsp.get_pixels; | |
| 725 | 371 |
| 1567 | 372 /* 88DCT setup */ |
| 8051 | 373 s->fdct[0] = dsp.fdct; |
| 1567 | 374 s->idct_put[0] = dsp.idct_put; |
| 8051 | 375 for (i = 0; i < 64; i++) |
| 1567 | 376 s->dv_zigzag[0][i] = dsp.idct_permutation[ff_zigzag_direct[i]]; |
| 725 | 377 |
| 1567 | 378 /* 248DCT setup */ |
| 8051 | 379 s->fdct[1] = dsp.fdct248; |
| 6001 | 380 s->idct_put[1] = ff_simple_idct248_put; // FIXME: need to add it to DSP |
| 8051 | 381 if (avctx->lowres){ |
| 382 for (i = 0; i < 64; i++){ | |
| 383 int j = ff_zigzag248_direct[i]; | |
| 384 s->dv_zigzag[1][i] = dsp.idct_permutation[(j & 7) + (j & 8) * 4 + (j & 48) / 2]; | |
| 2849 | 385 } |
| 386 }else | |
| 387 memcpy(s->dv_zigzag[1], ff_zigzag248_direct, 64); | |
| 725 | 388 |
| 723 | 389 /* XXX: do it only for constant case */ |
| 1567 | 390 dv_build_unquantize_tables(s, dsp.idct_permutation); |
|
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
391 |
|
1543
7542cb99b950
* providing MPEG codecs with a generic fields in AVFrame to use.
romansh
parents:
1540
diff
changeset
|
392 avctx->coded_frame = &s->picture; |
| 8051 | 393 s->avctx = avctx; |
| 2967 | 394 |
| 723 | 395 return 0; |
| 396 } | |
| 397 | |
|
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
398 // #define VLC_DEBUG |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
399 // #define printf(...) av_log(NULL, AV_LOG_ERROR, __VA_ARGS__) |
| 723 | 400 |
| 725 | 401 typedef struct BlockInfo { |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
402 const uint32_t *factor_table; |
| 1064 | 403 const uint8_t *scan_table; |
| 404 uint8_t pos; /* position in block */ | |
| 7706 | 405 void (*idct_put)(uint8_t *dest, int line_size, DCTELEM *block); |
| 1064 | 406 uint8_t partial_bit_count; |
| 407 uint16_t partial_bit_buffer; | |
| 725 | 408 int shift_offset; |
| 409 } BlockInfo; | |
| 723 | 410 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
/* bit budget for AC only in 5 MBs
   (presumably four blocks of 100 bits plus two blocks of 68 bits per MB --
   TODO confirm) */
static const int vs_total_ac_bits = 5 * (4 * 100 + 2 * 68);

/* see dv_88_areas and dv_248_areas for details */
static const int mb_area_start[5] = {
    1,
    6,
    21,
    43,
    64,
};
| 723 | 415 |
|
1895
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
416 static inline int get_bits_left(GetBitContext *s) |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
417 { |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
418 return s->size_in_bits - get_bits_count(s); |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
419 } |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
420 |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
421 static inline int put_bits_left(PutBitContext* s) |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
422 { |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
423 return (s->buf_end - s->buf) * 8 - put_bits_count(s); |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
424 } |
|
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
425 |
| 7980 | 426 /* decode ac coefficients */ |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
427 static void dv_decode_ac(GetBitContext *gb, BlockInfo *mb, DCTELEM *block) |
| 723 | 428 { |
| 7039 | 429 int last_index = gb->size_in_bits; |
| 8051 | 430 const uint8_t *scan_table = mb->scan_table; |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
431 const uint32_t *factor_table = mb->factor_table; |
| 8051 | 432 int pos = mb->pos; |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
433 int partial_bit_count = mb->partial_bit_count; |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
434 int level, run, vlc_len, index; |
| 2967 | 435 |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
436 OPEN_READER(re, gb); |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
437 UPDATE_CACHE(re, gb); |
| 2967 | 438 |
| 723 | 439 /* if we must parse a partial vlc, we do it here */ |
| 440 if (partial_bit_count > 0) { | |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
441 re_cache = ((unsigned)re_cache >> partial_bit_count) | |
| 8051 | 442 (mb->partial_bit_buffer << (sizeof(re_cache) * 8 - partial_bit_count)); |
| 2979 | 443 re_index -= partial_bit_count; |
| 444 mb->partial_bit_count = 0; | |
| 723 | 445 } |
| 446 | |
| 447 /* get the AC coefficients until last_index is reached */ | |
| 8051 | 448 for (;;) { |
| 723 | 449 #ifdef VLC_DEBUG |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
450 printf("%2d: bits=%04x index=%d\n", pos, SHOW_UBITS(re, gb, 16), re_index); |
| 723 | 451 #endif |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
452 /* our own optimized GET_RL_VLC */ |
| 8051 | 453 index = NEG_USR32(re_cache, TEX_VLC_BITS); |
| 2979 | 454 vlc_len = dv_rl_vlc[index].len; |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
455 if (vlc_len < 0) { |
|
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
456 index = NEG_USR32((unsigned)re_cache << TEX_VLC_BITS, -vlc_len) + dv_rl_vlc[index].level; |
|
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
457 vlc_len = TEX_VLC_BITS - vlc_len; |
|
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
458 } |
|
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
459 level = dv_rl_vlc[index].level; |
| 8051 | 460 run = dv_rl_vlc[index].run; |
| 2967 | 461 |
| 2979 | 462 /* gotta check if we're still within gb boundaries */ |
| 463 if (re_index + vlc_len > last_index) { | |
| 464 /* should be < 16 bits otherwise a codeword could have been parsed */ | |
| 465 mb->partial_bit_count = last_index - re_index; | |
| 466 mb->partial_bit_buffer = NEG_USR32(re_cache, mb->partial_bit_count); | |
| 467 re_index = last_index; | |
| 468 break; | |
| 469 } | |
| 470 re_index += vlc_len; | |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
471 |
|
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
472 #ifdef VLC_DEBUG |
| 2979 | 473 printf("run=%d level=%d\n", run, level); |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
474 #endif |
| 2979 | 475 pos += run; |
| 476 if (pos >= 64) | |
| 477 break; | |
| 2967 | 478 |
| 8051 | 479 level = (level * factor_table[pos] + (1 << (dv_iweight_bits - 1))) >> dv_iweight_bits; |
|
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
480 block[scan_table[pos]] = level; |
|
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
481 |
|
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
482 UPDATE_CACHE(re, gb); |
| 723 | 483 } |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
484 CLOSE_READER(re, gb); |
| 725 | 485 mb->pos = pos; |
| 723 | 486 } |
| 487 | |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
488 static inline void bit_copy(PutBitContext *pb, GetBitContext *gb) |
| 723 | 489 { |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
490 int bits_left = get_bits_left(gb); |
| 2847 | 491 while (bits_left >= MIN_CACHE_BITS) { |
| 492 put_bits(pb, MIN_CACHE_BITS, get_bits(gb, MIN_CACHE_BITS)); | |
| 493 bits_left -= MIN_CACHE_BITS; | |
| 723 | 494 } |
| 495 if (bits_left > 0) { | |
| 496 put_bits(pb, bits_left, get_bits(gb, bits_left)); | |
| 497 } | |
| 498 } | |
| 499 | |
| 8131 | 500 static inline void dv_calculate_mb_xy(DVVideoContext *s, DVwork_chunk *work_chunk, int m, int *mb_x, int *mb_y) |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
501 { |
| 8131 | 502 *mb_x = work_chunk->mb_coordinates[m] & 0xff; |
| 503 *mb_y = work_chunk->mb_coordinates[m] >> 8; | |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
504 |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
505 /* We work with 720p frames split in half. The odd half-frame (chan==2,3) is displaced :-( */ |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
506 if (s->sys->height == 720 && !(s->buf[1]&0x0C)) { |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
507 *mb_y -= (*mb_y>17)?18:-72; /* shifting the Y coordinate down by 72/2 macro blocks */ |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
508 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
509 } |
|
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
510 |
| 723 | 511 /* mb_x and mb_y are in units of 8 pixels */ |
| 8163 | 512 static int dv_decode_video_segment(AVCodecContext *avctx, DVwork_chunk *work_chunk) |
| 723 | 513 { |
| 8163 | 514 DVVideoContext *s = avctx->priv_data; |
| 723 | 515 int quant, dc, dct_mode, class1, j; |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
516 int mb_index, mb_x, mb_y, last_index; |
| 8011 | 517 int y_stride, linesize; |
| 723 | 518 DCTELEM *block, *block1; |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
519 int c_offset; |
| 1064 | 520 uint8_t *y_ptr; |
| 6266 | 521 const uint8_t *buf_ptr; |
| 723 | 522 PutBitContext pb, vs_pb; |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
523 GetBitContext gb; |
|
7614
1afa1171b7b2
Introducing DV_MAX_BPM macro instead of a hardcoded value for the
romansh
parents:
7538
diff
changeset
|
524 BlockInfo mb_data[5 * DV_MAX_BPM], *mb, *mb1; |
|
1afa1171b7b2
Introducing DV_MAX_BPM macro instead of a hardcoded value for the
romansh
parents:
7538
diff
changeset
|
525 DECLARE_ALIGNED_16(DCTELEM, sblock[5*DV_MAX_BPM][64]); |
| 3089 | 526 DECLARE_ALIGNED_8(uint8_t, mb_bit_buffer[80 + 4]); /* allow some slack */ |
| 527 DECLARE_ALIGNED_8(uint8_t, vs_bit_buffer[5 * 80 + 4]); /* allow some slack */ | |
| 8051 | 528 const int log2_blocksize = 3-s->avctx->lowres; |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
529 int is_field_mode[5]; |
| 2967 | 530 |
| 8051 | 531 assert((((int)mb_bit_buffer) & 7) == 0); |
| 532 assert((((int)vs_bit_buffer) & 7) == 0); | |
| 2967 | 533 |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
534 memset(sblock, 0, sizeof(sblock)); |
| 723 | 535 |
| 536 /* pass 1 : read DC and AC coefficients in blocks */ | |
| 8131 | 537 buf_ptr = &s->buf[work_chunk->buf_offset*80]; |
| 8051 | 538 block1 = &sblock[0][0]; |
| 539 mb1 = mb_data; | |
|
1522
79dddc5cd990
removed the obsolete and unused parameters of init_put_bits
alex
parents:
1507
diff
changeset
|
540 init_put_bits(&vs_pb, vs_bit_buffer, 5 * 80); |
| 8051 | 541 for (mb_index = 0; mb_index < 5; mb_index++, mb1 += s->sys->bpm, block1 += s->sys->bpm * 64) { |
| 723 | 542 /* skip header */ |
| 543 quant = buf_ptr[3] & 0x0f; | |
| 544 buf_ptr += 4; | |
|
1522
79dddc5cd990
removed the obsolete and unused parameters of init_put_bits
alex
parents:
1507
diff
changeset
|
545 init_put_bits(&pb, mb_bit_buffer, 80); |
| 8051 | 546 mb = mb1; |
| 723 | 547 block = block1; |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
548 is_field_mode[mb_index] = 0; |
| 8051 | 549 for (j = 0; j < s->sys->bpm; j++) { |
|
7616
685ef77c9fe5
Making block size in bits variable and dependent on the DV spec
romansh
parents:
7615
diff
changeset
|
550 last_index = s->sys->block_sizes[j]; |
| 2979 | 551 init_get_bits(&gb, buf_ptr, last_index); |
| 2967 | 552 |
| 723 | 553 /* get the dc */ |
| 8051 | 554 dc = get_sbits(&gb, 9); |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
555 dct_mode = get_bits1(&gb); |
| 8051 | 556 class1 = get_bits(&gb, 2); |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
557 if (DV_PROFILE_IS_HD(s->sys)) { |
| 8051 | 558 mb->idct_put = s->idct_put[0]; |
| 559 mb->scan_table = s->dv_zigzag[0]; | |
| 560 mb->factor_table = s->dv100_idct_factor[((s->sys->height == 720) << 1) | (j >= 4)][class1][quant]; | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
561 is_field_mode[mb_index] |= !j && dct_mode; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
562 } else { |
| 8051 | 563 mb->idct_put = s->idct_put[dct_mode && log2_blocksize == 3]; |
| 564 mb->scan_table = s->dv_zigzag[dct_mode]; | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
565 mb->factor_table = s->dv_idct_factor[class1 == 3][dct_mode] |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
566 [quant + dv_quant_offset[class1]]; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
567 } |
| 723 | 568 dc = dc << 2; |
| 569 /* convert to unsigned because 128 is not added in the | |
| 570 standard IDCT */ | |
| 571 dc += 1024; | |
| 572 block[0] = dc; | |
| 573 buf_ptr += last_index >> 3; | |
| 8051 | 574 mb->pos = 0; |
| 725 | 575 mb->partial_bit_count = 0; |
| 723 | 576 |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
577 #ifdef VLC_DEBUG |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
578 printf("MB block: %d, %d ", mb_index, j); |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
579 #endif |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
580 dv_decode_ac(&gb, mb, block); |
| 723 | 581 |
| 582 /* write the remaining bits in a new buffer only if the | |
| 583 block is finished */ | |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
584 if (mb->pos >= 64) |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
585 bit_copy(&pb, &gb); |
| 2967 | 586 |
| 723 | 587 block += 64; |
| 725 | 588 mb++; |
| 723 | 589 } |
| 2967 | 590 |
| 723 | 591 /* pass 2 : we can do it just after */ |
| 592 #ifdef VLC_DEBUG | |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
593 printf("***pass 2 size=%d MB#=%d\n", put_bits_count(&pb), mb_index); |
| 723 | 594 #endif |
| 595 block = block1; | |
| 8051 | 596 mb = mb1; |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
597 init_get_bits(&gb, mb_bit_buffer, put_bits_count(&pb)); |
| 2979 | 598 flush_put_bits(&pb); |
| 8051 | 599 for (j = 0; j < s->sys->bpm; j++, block += 64, mb++) { |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
600 if (mb->pos < 64 && get_bits_left(&gb) > 0) { |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
601 dv_decode_ac(&gb, mb, block); |
| 723 | 602 /* if still not finished, no need to parse other blocks */ |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
603 if (mb->pos < 64) |
|
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
604 break; |
| 723 | 605 } |
| 606 } | |
| 607 /* all blocks are finished, so the extra bytes can be used at | |
| 608 the video segment level */ | |
|
7615
290fd3ae1219
Making the number of blocks per macroblock dependent on the DV stream
romansh
parents:
7614
diff
changeset
|
609 if (j >= s->sys->bpm) |
| 2979 | 610 bit_copy(&vs_pb, &gb); |
| 723 | 611 } |
| 612 | |
| 613 /* we need a pass other the whole video segment */ | |
| 614 #ifdef VLC_DEBUG | |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
615 printf("***pass 3 size=%d\n", put_bits_count(&vs_pb)); |
| 723 | 616 #endif |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
617 block = &sblock[0][0]; |
| 8051 | 618 mb = mb_data; |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
619 init_get_bits(&gb, vs_bit_buffer, put_bits_count(&vs_pb)); |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
620 flush_put_bits(&vs_pb); |
| 8051 | 621 for (mb_index = 0; mb_index < 5; mb_index++) { |
| 622 for (j = 0; j < s->sys->bpm; j++) { | |
|
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
623 if (mb->pos < 64) { |
| 723 | 624 #ifdef VLC_DEBUG |
| 625 printf("start %d:%d\n", mb_index, j); | |
| 626 #endif | |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
627 dv_decode_ac(&gb, mb, block); |
| 723 | 628 } |
| 2979 | 629 if (mb->pos >= 64 && mb->pos < 127) |
| 630 av_log(NULL, AV_LOG_ERROR, "AC EOB marker is absent pos=%d\n", mb->pos); | |
| 723 | 631 block += 64; |
| 725 | 632 mb++; |
| 723 | 633 } |
| 634 } | |
| 2967 | 635 |
| 723 | 636 /* compute idct and place blocks */ |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
637 block = &sblock[0][0]; |
| 8051 | 638 mb = mb_data; |
| 639 for (mb_index = 0; mb_index < 5; mb_index++) { | |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
640 dv_calculate_mb_xy(s, work_chunk, mb_index, &mb_x, &mb_y); |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
641 |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
642 /* idct_put'ting luminance */ |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
643 if ((s->sys->pix_fmt == PIX_FMT_YUV420P) || |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
644 (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x >= (704 / 8)) || |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
645 (s->sys->height >= 720 && mb_y != 134)) { |
| 8051 | 646 y_stride = (s->picture.linesize[0] << ((!is_field_mode[mb_index]) * log2_blocksize)); |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
647 } else { |
| 8051 | 648 y_stride = (2 << log2_blocksize); |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
649 } |
| 8051 | 650 y_ptr = s->picture.data[0] + ((mb_y * s->picture.linesize[0] + mb_x) << log2_blocksize); |
| 651 linesize = s->picture.linesize[0] << is_field_mode[mb_index]; | |
| 652 mb[0] .idct_put(y_ptr , linesize, block + 0*64); | |
| 8011 | 653 if (s->sys->video_stype == 4) { /* SD 422 */ |
| 8051 | 654 mb[2].idct_put(y_ptr + (1 << log2_blocksize) , linesize, block + 2*64); |
| 8011 | 655 } else { |
| 8051 | 656 mb[1].idct_put(y_ptr + (1 << log2_blocksize) , linesize, block + 1*64); |
| 657 mb[2].idct_put(y_ptr + y_stride, linesize, block + 2*64); | |
| 658 mb[3].idct_put(y_ptr + (1 << log2_blocksize) + y_stride, linesize, block + 3*64); | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
659 } |
| 8011 | 660 mb += 4; |
| 661 block += 4*64; | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
662 |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
663 /* idct_put'ting chrominance */ |
| 8051 | 664 c_offset = (((mb_y >> (s->sys->pix_fmt == PIX_FMT_YUV420P)) * s->picture.linesize[1] + |
| 665 (mb_x >> ((s->sys->pix_fmt == PIX_FMT_YUV411P) ? 2 : 1))) << log2_blocksize); | |
| 666 for (j = 2; j; j--) { | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
667 uint8_t *c_ptr = s->picture.data[j] + c_offset; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
668 if (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x >= (704 / 8)) { |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
669 uint64_t aligned_pixels[64/8]; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
670 uint8_t *pixels = (uint8_t*)aligned_pixels; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
671 uint8_t *c_ptr1, *ptr1; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
672 int x, y; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
673 mb->idct_put(pixels, 8, block); |
| 8051 | 674 for (y = 0; y < (1 << log2_blocksize); y++, c_ptr += s->picture.linesize[j], pixels += 8) { |
| 675 ptr1 = pixels + (1 << (log2_blocksize - 1)); | |
| 676 c_ptr1 = c_ptr + (s->picture.linesize[j] << log2_blocksize); | |
| 677 for (x = 0; x < (1 << (log2_blocksize - 1)); x++) { | |
| 678 c_ptr[x] = pixels[x]; | |
| 679 c_ptr1[x] = ptr1[x]; | |
|
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
680 } |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
681 } |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
682 block += 64; mb++; |
|
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
683 } else { |
| 8051 | 684 y_stride = (mb_y == 134) ? (1 << log2_blocksize) : |
| 685 s->picture.linesize[j] << ((!is_field_mode[mb_index]) * log2_blocksize); | |
| 686 linesize = s->picture.linesize[j] << is_field_mode[mb_index]; | |
| 687 (mb++)-> idct_put(c_ptr , linesize, block); block += 64; | |
| 8011 | 688 if (s->sys->bpm == 8) { |
| 8051 | 689 (mb++)->idct_put(c_ptr + y_stride, linesize, block); block += 64; |
| 8011 | 690 } |
| 723 | 691 } |
| 692 } | |
| 693 } | |
| 8163 | 694 return 0; |
| 723 | 695 } |
| 696 | |
|
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
697 #if ENABLE_SMALL |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
698 /* Converts run and level (where level != 0) pair into vlc, returning bit size */ |
|
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
699 static av_always_inline int dv_rl2vlc(int run, int level, int sign, uint32_t* vlc) |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
700 { |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
701 int size; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
702 if (run < DV_VLC_MAP_RUN_SIZE && level < DV_VLC_MAP_LEV_SIZE) { |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
703 *vlc = dv_vlc_map[run][level].vlc | sign; |
| 2979 | 704 size = dv_vlc_map[run][level].size; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
705 } |
| 2967 | 706 else { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
707 if (level < DV_VLC_MAP_LEV_SIZE) { |
| 2979 | 708 *vlc = dv_vlc_map[0][level].vlc | sign; |
| 709 size = dv_vlc_map[0][level].size; | |
| 710 } else { | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
711 *vlc = 0xfe00 | (level << 1) | sign; |
| 2979 | 712 size = 16; |
| 713 } | |
| 714 if (run) { | |
| 715 *vlc |= ((run < 16) ? dv_vlc_map[run-1][0].vlc : | |
| 716 (0x1f80 | (run - 1))) << size; | |
| 8051 | 717 size += (run < 16) ? dv_vlc_map[run-1][0].size : 13; |
| 2979 | 718 } |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
719 } |
| 2967 | 720 |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
721 return size; |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
722 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
723 |
|
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
724 static av_always_inline int dv_rl2vlc_size(int run, int level) |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
725 { |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
726 int size; |
| 2967 | 727 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
728 if (run < DV_VLC_MAP_RUN_SIZE && level < DV_VLC_MAP_LEV_SIZE) { |
| 2979 | 729 size = dv_vlc_map[run][level].size; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
730 } |
| 2967 | 731 else { |
| 2979 | 732 size = (level < DV_VLC_MAP_LEV_SIZE) ? dv_vlc_map[0][level].size : 16; |
| 733 if (run) { | |
| 734 size += (run < 16) ? dv_vlc_map[run-1][0].size : 13; | |
| 735 } | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
736 } |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
737 return size; |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
738 } |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
739 #else |
|
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
740 static av_always_inline int dv_rl2vlc(int run, int l, int sign, uint32_t* vlc) |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
741 { |
| 2847 | 742 *vlc = dv_vlc_map[run][l].vlc | sign; |
| 743 return dv_vlc_map[run][l].size; | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
744 } |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
745 |
|
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
746 static av_always_inline int dv_rl2vlc_size(int run, int l) |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
747 { |
| 2847 | 748 return dv_vlc_map[run][l].size; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
749 } |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
750 #endif |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
751 |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
752 typedef struct EncBlockInfo { |
| 8051 | 753 int area_q[4]; |
| 754 int bit_size[4]; | |
| 755 int prev[5]; | |
| 756 int cur_ac; | |
| 757 int cno; | |
| 758 int dct_mode; | |
| 759 DCTELEM mb[64]; | |
| 760 uint8_t next[64]; | |
| 761 uint8_t sign[64]; | |
| 762 uint8_t partial_bit_count; | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
763 uint32_t partial_bit_buffer; /* we can't use uint16_t here */ |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
764 } EncBlockInfo; |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
765 |
| 8051 | 766 static av_always_inline PutBitContext* dv_encode_ac(EncBlockInfo* bi, |
| 767 PutBitContext* pb_pool, | |
| 768 PutBitContext* pb_end) | |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
769 { |
| 8051 | 770 int prev, bits_left; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
771 PutBitContext* pb = pb_pool; |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
772 int size = bi->partial_bit_count; |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
773 uint32_t vlc = bi->partial_bit_buffer; |
| 2847 | 774 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
775 bi->partial_bit_count = bi->partial_bit_buffer = 0; |
| 8051 | 776 for (;;){ |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
777 /* Find suitable storage space */ |
|
1875
45a1592dadca
* moving some of the commonly used bit reading/writing functions
romansh
parents:
1726
diff
changeset
|
778 for (; size > (bits_left = put_bits_left(pb)); pb++) { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
779 if (bits_left) { |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
780 size -= bits_left; |
| 2979 | 781 put_bits(pb, bits_left, vlc >> size); |
| 8051 | 782 vlc = vlc & ((1 << size) - 1); |
| 2979 | 783 } |
| 784 if (pb + 1 >= pb_end) { | |
| 8051 | 785 bi->partial_bit_count = size; |
| 2979 | 786 bi->partial_bit_buffer = vlc; |
| 787 return pb; | |
| 788 } | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
789 } |
| 2967 | 790 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
791 /* Store VLC */ |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
792 put_bits(pb, size, vlc); |
| 2967 | 793 |
| 8051 | 794 if (bi->cur_ac >= 64) |
| 2847 | 795 break; |
| 2967 | 796 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
797 /* Construct the next VLC */ |
| 8051 | 798 prev = bi->cur_ac; |
| 2847 | 799 bi->cur_ac = bi->next[prev]; |
| 8051 | 800 if (bi->cur_ac < 64){ |
| 2847 | 801 size = dv_rl2vlc(bi->cur_ac - prev - 1, bi->mb[bi->cur_ac], bi->sign[bi->cur_ac], &vlc); |
| 802 } else { | |
| 803 size = 4; vlc = 6; /* End Of Block stamp */ | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
804 } |
| 2847 | 805 } |
| 806 return pb; | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
807 } |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
808 |
|
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
809 static av_always_inline void dv_set_class_number(DCTELEM* blk, EncBlockInfo* bi, |
| 8051 | 810 const uint8_t* zigzag_scan, |
| 811 const int *weight, int bias) | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
812 { |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
813 int i, area; |
|
3152
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
814 /* We offer two different methods for class number assignment: the |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
815 method suggested in SMPTE 314M Table 22, and an improved |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
816 method. The SMPTE method is very conservative; it assigns class |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
817 3 (i.e. severe quantization) to any block where the largest AC |
| 7980 | 818 component is greater than 36. FFmpeg's DV encoder tracks AC bit |
|
3152
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
819 consumption precisely, so there is no need to bias most blocks |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
820 towards strongly lossy compression. Instead, we assign class 2 |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
821 to most blocks, and use class 3 only when strictly necessary |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
822 (for blocks whose largest AC component exceeds 255). */ |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
823 |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
824 #if 0 /* SMPTE spec method */ |
| 2847 | 825 static const int classes[] = {12, 24, 36, 0xffff}; |
| 7980 | 826 #else /* improved FFmpeg method */ |
|
3152
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
827 static const int classes[] = {-1, -1, 255, 0xffff}; |
|
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
828 #endif |
| 8051 | 829 int max = classes[0]; |
| 830 int prev = 0; | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
831 |
| 2967 | 832 bi->mb[0] = blk[0]; |
| 833 | |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
834 for (area = 0; area < 4; area++) { |
| 8051 | 835 bi->prev[area] = prev; |
| 2847 | 836 bi->bit_size[area] = 1; // 4 areas 4 bits for EOB :) |
| 8051 | 837 for (i = mb_area_start[area]; i < mb_area_start[area+1]; i++) { |
| 2847 | 838 int level = blk[zigzag_scan[i]]; |
| 2967 | 839 |
| 8051 | 840 if (level + 15 > 30U) { |
| 841 bi->sign[i] = (level >> 31) & 1; | |
|
3149
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
842 /* weigh it and and shift down into range, adding for rounding */ |
|
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
843 /* the extra division by a factor of 2^4 reverses the 8x expansion of the DCT |
|
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
844 AND the 2x doubling of the weights */ |
| 8051 | 845 level = (FFABS(level) * weight[i] + (1 << (dv_weight_bits+3))) >> (dv_weight_bits+4); |
|
3149
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
846 bi->mb[i] = level; |
| 8051 | 847 if (level > max) |
| 848 max = level; | |
| 2847 | 849 bi->bit_size[area] += dv_rl2vlc_size(i - prev - 1, level); |
| 850 bi->next[prev]= i; | |
| 8051 | 851 prev = i; |
| 2847 | 852 } |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
853 } |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
854 } |
| 2847 | 855 bi->next[prev]= i; |
| 8051 | 856 for (bi->cno = 0; max > classes[bi->cno]; bi->cno++); |
| 2847 | 857 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
858 bi->cno += bias; |
| 2967 | 859 |
| 2847 | 860 if (bi->cno >= 3) { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
861 bi->cno = 3; |
| 8051 | 862 prev = 0; |
| 863 i = bi->next[prev]; | |
| 2847 | 864 for (area = 0; area < 4; area++) { |
| 8051 | 865 bi->prev[area] = prev; |
| 2847 | 866 bi->bit_size[area] = 1; // 4 areas 4 bits for EOB :) |
| 8051 | 867 for (; i < mb_area_start[area+1]; i = bi->next[i]) { |
| 868 bi->mb[i] >>= 1; | |
| 2967 | 869 |
| 2847 | 870 if (bi->mb[i]) { |
| 871 bi->bit_size[area] += dv_rl2vlc_size(i - prev - 1, bi->mb[i]); | |
| 872 bi->next[prev]= i; | |
| 8051 | 873 prev = i; |
| 2847 | 874 } |
| 875 } | |
| 876 } | |
| 877 bi->next[prev]= i; | |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
878 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
879 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
880 |
| 2847 | 881 //FIXME replace this by dsputil |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
882 #define SC(x, y) ((s[x] - s[y]) ^ ((s[x] - s[y]) >> 7)) |
|
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
883 static av_always_inline int dv_guess_dct_mode(DCTELEM *blk) { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
884 DCTELEM *s; |
| 8051 | 885 int score88 = 0; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
886 int score248 = 0; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
887 int i; |
| 2967 | 888 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
889 /* Compute 8-8 score (small values give a better chance for 8-8 DCT) */ |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
890 s = blk; |
| 8051 | 891 for (i = 0; i < 7; i++) { |
| 2967 | 892 score88 += SC(0, 8) + SC(1, 9) + SC(2, 10) + SC(3, 11) + |
| 2979 | 893 SC(4, 12) + SC(5,13) + SC(6, 14) + SC(7, 15); |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
894 s += 8; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
895 } |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
896 /* Compute 2-4-8 score (small values give a better chance for 2-4-8 DCT) */ |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
897 s = blk; |
| 8051 | 898 for (i = 0; i < 6; i++) { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
899 score248 += SC(0, 16) + SC(1,17) + SC(2, 18) + SC(3, 19) + |
| 2979 | 900 SC(4, 20) + SC(5,21) + SC(6, 22) + SC(7, 23); |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
901 s += 8; |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
902 } |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
903 |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
904 return (score88 - score248 > -10); |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
905 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
906 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
907 static inline void dv_guess_qnos(EncBlockInfo* blks, int* qnos) |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
908 { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
909 int size[5]; |
| 3140 | 910 int i, j, k, a, prev, a2; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
911 EncBlockInfo* b; |
| 2847 | 912 |
| 8051 | 913 size[0] = size[1] = size[2] = size[3] = size[4] = 1 << 24; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
914 do { |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
915 b = blks; |
| 8051 | 916 for (i = 0; i < 5; i++) { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
917 if (!qnos[i]) |
| 2979 | 918 continue; |
| 2967 | 919 |
| 2979 | 920 qnos[i]--; |
| 921 size[i] = 0; | |
| 8051 | 922 for (j = 0; j < 6; j++, b++) { |
| 923 for (a = 0; a < 4; a++) { | |
| 2979 | 924 if (b->area_q[a] != dv_quant_shifts[qnos[i] + dv_quant_offset[b->cno]][a]) { |
| 925 b->bit_size[a] = 1; // 4 areas 4 bits for EOB :) | |
| 926 b->area_q[a]++; | |
| 8051 | 927 prev = b->prev[a]; |
| 3147 | 928 assert(b->next[prev] >= mb_area_start[a+1] || b->mb[prev]); |
| 8051 | 929 for (k = b->next[prev] ; k < mb_area_start[a+1]; k = b->next[k]) { |
| 2979 | 930 b->mb[k] >>= 1; |
| 931 if (b->mb[k]) { | |
| 2847 | 932 b->bit_size[a] += dv_rl2vlc_size(k - prev - 1, b->mb[k]); |
| 8051 | 933 prev = k; |
| 2847 | 934 } else { |
| 8051 | 935 if (b->next[k] >= mb_area_start[a+1] && b->next[k]<64){ |
| 936 for (a2 = a + 1; b->next[k] >= mb_area_start[a2+1]; a2++) | |
|
3146
dcae1bde37ac
size[0-3] are not initialized (and can get random negative trash
michael
parents:
3143
diff
changeset
|
937 b->prev[a2] = prev; |
| 8051 | 938 assert(a2 < 4); |
| 3140 | 939 assert(b->mb[b->next[k]]); |
| 940 b->bit_size[a2] += dv_rl2vlc_size(b->next[k] - prev - 1, b->mb[b->next[k]]) | |
| 941 -dv_rl2vlc_size(b->next[k] - k - 1, b->mb[b->next[k]]); | |
| 8051 | 942 assert(b->prev[a2] == k && (a2 + 1 >= 4 || b->prev[a2+1] != k)); |
| 3147 | 943 b->prev[a2] = prev; |
| 3140 | 944 } |
| 2847 | 945 b->next[prev] = b->next[k]; |
| 946 } | |
| 2979 | 947 } |
| 2847 | 948 b->prev[a+1]= prev; |
| 2979 | 949 } |
| 950 size[i] += b->bit_size[a]; | |
| 951 } | |
| 952 } | |
| 8051 | 953 if (vs_total_ac_bits >= size[0] + size[1] + size[2] + size[3] + size[4]) |
| 3142 | 954 return; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
955 } |
| 3140 | 956 } while (qnos[0]|qnos[1]|qnos[2]|qnos[3]|qnos[4]); |
| 957 | |
| 958 | |
| 8051 | 959 for (a = 2; a == 2 || vs_total_ac_bits < size[0]; a += a){ |
| 3140 | 960 b = blks; |
| 8051 | 961 size[0] = 5 * 6 * 4; //EOB |
| 962 for (j = 0; j < 6 *5; j++, b++) { | |
| 963 prev = b->prev[0]; | |
| 964 for (k = b->next[prev]; k < 64; k = b->next[k]) { | |
| 965 if (b->mb[k] < a && b->mb[k] > -a){ | |
| 3140 | 966 b->next[prev] = b->next[k]; |
| 967 }else{ | |
| 968 size[0] += dv_rl2vlc_size(k - prev - 1, b->mb[k]); | |
| 8051 | 969 prev = k; |
| 3140 | 970 } |
| 971 } | |
| 972 } | |
| 973 } | |
| 1567 | 974 } |
| 975 | |
| 8163 | 976 static int dv_encode_video_segment(AVCodecContext *avctx, DVwork_chunk *work_chunk) |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
977 { |
| 8163 | 978 DVVideoContext *s = avctx->priv_data; |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
979 int mb_index, i, j; |
| 2967 | 980 int mb_x, mb_y, c_offset, linesize; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
981 uint8_t* y_ptr; |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
982 uint8_t* data; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
983 uint8_t* ptr; |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
984 uint8_t* dif; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
985 int do_edge_wrap; |
|
4675
c23a5c8263bc
force 16-bytes alignement of block array, as needed by the implementation of ff_dct_sse2
gpoirier
parents:
4666
diff
changeset
|
986 DECLARE_ALIGNED_16(DCTELEM, block[64]); |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
987 EncBlockInfo enc_blks[5*6]; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
988 PutBitContext pbs[5*6]; |
| 2967 | 989 PutBitContext* pb; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
990 EncBlockInfo* enc_blk; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
991 int vs_bit_size = 0; |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
992 int qnos[5]; |
| 2967 | 993 |
|
4675
c23a5c8263bc
force 16-bytes alignement of block array, as needed by the implementation of ff_dct_sse2
gpoirier
parents:
4666
diff
changeset
|
994 assert((((int)block) & 15) == 0); |
| 2967 | 995 |
| 8131 | 996 dif = &s->buf[work_chunk->buf_offset*80]; |
| 1567 | 997 enc_blk = &enc_blks[0]; |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
998 pb = &pbs[0]; |
| 8051 | 999 for (mb_index = 0; mb_index < 5; mb_index++) { |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
1000 dv_calculate_mb_xy(s, work_chunk, mb_index, &mb_x, &mb_y); |
| 8051 | 1001 y_ptr = s->picture.data[0] + ((mb_y * s->picture.linesize[0] + mb_x) << 3); |
| 1002 c_offset = (((mb_y >> (s->sys->pix_fmt == PIX_FMT_YUV420P)) * s->picture.linesize[1] + | |
| 1003 (mb_x >> ((s->sys->pix_fmt == PIX_FMT_YUV411P) ? 2 : 1))) << 3); | |
| 1004 do_edge_wrap = 0; | |
| 2979 | 1005 qnos[mb_index] = 15; /* No quantization */ |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1006 ptr = dif + mb_index*80 + 4; |
| 8051 | 1007 for (j = 0; j < 6; j++) { |
| 3167 | 1008 int dummy = 0; |
| 1009 if (s->sys->pix_fmt == PIX_FMT_YUV422P) { /* 4:2:2 */ | |
| 1010 if (j == 0 || j == 2) { | |
| 1011 /* Y0 Y1 */ | |
| 8051 | 1012 data = y_ptr + ((j >> 1) * 8); |
| 3167 | 1013 linesize = s->picture.linesize[0]; |
| 1014 } else if (j > 3) { | |
| 1015 /* Cr Cb */ | |
| 8051 | 1016 data = s->picture.data[6 - j] + c_offset; |
| 3167 | 1017 linesize = s->picture.linesize[6 - j]; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1018 } else { |
| 3167 | 1019 /* j=1 and j=3 are "dummy" blocks, used for AC data only */ |
| 8051 | 1020 data = 0; |
| 3167 | 1021 linesize = 0; |
| 8051 | 1022 dummy = 1; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1023 } |
| 3167 | 1024 } else { /* 4:1:1 or 4:2:0 */ |
| 1025 if (j < 4) { /* Four Y blocks */ | |
| 1026 /* NOTE: at end of line, the macroblock is handled as 420 */ | |
| 1027 if (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x < (704 / 8)) { | |
| 1028 data = y_ptr + (j * 8); | |
| 1029 } else { | |
| 1030 data = y_ptr + ((j & 1) * 8) + ((j >> 1) * 8 * s->picture.linesize[0]); | |
| 1031 } | |
| 1032 linesize = s->picture.linesize[0]; | |
| 1033 } else { /* Cr and Cb blocks */ | |
| 1034 /* don't ask Fabrice why they inverted Cb and Cr ! */ | |
| 8051 | 1035 data = s->picture.data [6 - j] + c_offset; |
| 3167 | 1036 linesize = s->picture.linesize[6 - j]; |
| 1037 if (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x >= (704 / 8)) | |
| 1038 do_edge_wrap = 1; | |
| 1039 } | |
| 2979 | 1040 } |
| 2967 | 1041 |
| 2979 | 1042 /* Everything is set up -- now just copy data -> DCT block */ |
| 1043 if (do_edge_wrap) { /* Edge wrap copy: 4x16 -> 8x8 */ | |
| 1044 uint8_t* d; | |
| 1045 DCTELEM *b = block; | |
| 8051 | 1046 for (i = 0; i < 8; i++) { |
| 2979 | 1047 d = data + 8 * linesize; |
| 1048 b[0] = data[0]; b[1] = data[1]; b[2] = data[2]; b[3] = data[3]; | |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1049 b[4] = d[0]; b[5] = d[1]; b[6] = d[2]; b[7] = d[3]; |
| 2979 | 1050 data += linesize; |
| 1051 b += 8; | |
| 1052 } | |
| 1053 } else { /* Simple copy: 8x8 -> 8x8 */ | |
| 3167 | 1054 if (!dummy) |
| 1055 s->get_pixels(block, data, linesize); | |
| 2979 | 1056 } |
| 2967 | 1057 |
| 8051 | 1058 if (s->avctx->flags & CODEC_FLAG_INTERLACED_DCT) |
| 2847 | 1059 enc_blk->dct_mode = dv_guess_dct_mode(block); |
| 1060 else | |
| 1061 enc_blk->dct_mode = 0; | |
| 2979 | 1062 enc_blk->area_q[0] = enc_blk->area_q[1] = enc_blk->area_q[2] = enc_blk->area_q[3] = 0; |
| 1063 enc_blk->partial_bit_count = 0; | |
| 1064 enc_blk->partial_bit_buffer = 0; | |
| 1065 enc_blk->cur_ac = 0; | |
| 2967 | 1066 |
| 3167 | 1067 if (dummy) { |
| 1068 /* We rely on the fact that encoding all zeros leads to an immediate EOB, | |
| 1069 which is precisely what the spec calls for in the "dummy" blocks. */ | |
| 1070 memset(block, 0, sizeof(block)); | |
| 1071 } else { | |
| 1072 s->fdct[enc_blk->dct_mode](block); | |
| 1073 } | |
| 2967 | 1074 |
| 2979 | 1075 dv_set_class_number(block, enc_blk, |
|
3149
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
1076 enc_blk->dct_mode ? ff_zigzag248_direct : ff_zigzag_direct, |
|
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
1077 enc_blk->dct_mode ? dv_weight_248 : dv_weight_88, |
|
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
1078 j/4); |
| 2967 | 1079 |
|
7616
685ef77c9fe5
Making block size in bits variable and dependent on the DV spec
romansh
parents:
7615
diff
changeset
|
1080 init_put_bits(pb, ptr, s->sys->block_sizes[j]/8); |
| 2979 | 1081 put_bits(pb, 9, (uint16_t)(((enc_blk->mb[0] >> 3) - 1024 + 2) >> 2)); |
| 1082 put_bits(pb, 1, enc_blk->dct_mode); | |
| 1083 put_bits(pb, 2, enc_blk->cno); | |
| 2967 | 1084 |
| 2979 | 1085 vs_bit_size += enc_blk->bit_size[0] + enc_blk->bit_size[1] + |
| 1086 enc_blk->bit_size[2] + enc_blk->bit_size[3]; | |
| 1087 ++enc_blk; | |
| 1088 ++pb; | |
|
7616
685ef77c9fe5
Making block size in bits variable and dependent on the DV spec
romansh
parents:
7615
diff
changeset
|
1089 ptr += s->sys->block_sizes[j]/8; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1090 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1091 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1092 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1093 if (vs_total_ac_bits < vs_bit_size) |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1094 dv_guess_qnos(&enc_blks[0], &qnos[0]); |
|
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1095 |
| 8051 | 1096 for (i = 0; i < 5; i++) { |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1097 dif[i*80 + 3] = qnos[i]; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1098 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1099 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1100 /* First pass over individual cells only */ |
| 8051 | 1101 for (j = 0; j < 5 * 6; j++) |
| 2847 | 1102 dv_encode_ac(&enc_blks[j], &pbs[j], &pbs[j+1]); |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1103 |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1104 /* Second pass over each MB space */ |
| 8051 | 1105 for (j = 0; j < 5 * 6; j += 6) { |
| 1106 pb = &pbs[j]; | |
| 1107 for (i = 0; i < 6; i++) { | |
| 2847 | 1108 if (enc_blks[i+j].partial_bit_count) |
| 8051 | 1109 pb = dv_encode_ac(&enc_blks[i+j], pb, &pbs[j+6]); |
| 2847 | 1110 } |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1111 } |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1112 |
| 8050 | 1113 /* Third and final pass over the whole video segment space */ |
| 8051 | 1114 pb = &pbs[0]; |
| 1115 for (j = 0; j < 5 * 6; j++) { | |
| 2847 | 1116 if (enc_blks[j].partial_bit_count) |
| 8051 | 1117 pb = dv_encode_ac(&enc_blks[j], pb, &pbs[6*5]); |
|
3139
e58fb7ffbb4f
print a big warning if we mess up and run out of space ...
michael
parents:
3089
diff
changeset
|
1118 if (enc_blks[j].partial_bit_count) |
|
e58fb7ffbb4f
print a big warning if we mess up and run out of space ...
michael
parents:
3089
diff
changeset
|
1119 av_log(NULL, AV_LOG_ERROR, "ac bitstream overflow\n"); |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1120 } |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1121 |
| 8051 | 1122 for (j = 0; j < 5 * 6; j++) |
|
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1123 flush_put_bits(&pbs[j]); |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1124 |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1125 return 0; |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1126 } |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1127 |
|
7776
dbcdd0165e55
Replace generic CONFIG_DECODERS preprocessor conditionals by more specific
diego
parents:
7715
diff
changeset
|
#ifdef CONFIG_DVVIDEO_DECODER
/**
 * Decode one DV frame.
 *
 * NOTE: exactly one frame must be given (120000 bytes for NTSC,
 * 144000 bytes for PAL - or twice those for 50Mbps)
 *
 * @param avctx     codec context; priv_data must be a DVVideoContext
 * @param data      receives a copy of the decoded AVFrame
 * @param data_size set to sizeof(AVFrame) on success
 * @param buf       input data, passed to dv_frame_profile() to find the profile
 * @param buf_size  number of bytes available in buf
 * @return the frame size of the detected profile, or -1 if no profile
 *         matches, the input is shorter than one frame, the dynamic tables
 *         cannot be initialised or no picture buffer could be obtained
 */
static int dvvideo_decode_frame(AVCodecContext *avctx,
                                 void *data, int *data_size,
                                 const uint8_t *buf, int buf_size)
{
    DVVideoContext *s   = avctx->priv_data;
    AVFrame        *out = data;

    /* NOTE: we only accept several full frames */
    s->sys = dv_frame_profile(buf);
    if (!s->sys)
        return -1;
    if (buf_size < s->sys->frame_size)
        return -1;
    if (dv_init_dynamic_tables(s->sys))
        return -1;

    /* Hand back the picture of the previous call, if there is one. */
    if (s->picture.data[0])
        avctx->release_buffer(avctx, &s->picture);

    s->picture.reference = 0;
    s->picture.key_frame = 1;
    s->picture.pict_type = FF_I_TYPE;

    /* Publish the stream parameters of the profile before asking for a buffer. */
    avctx->pix_fmt   = s->sys->pix_fmt;
    avctx->time_base = s->sys->time_base;
    avcodec_set_dimensions(avctx, s->sys->width, s->sys->height);

    if (avctx->get_buffer(avctx, &s->picture) < 0) {
        av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
        return -1;
    }
    s->picture.interlaced_frame = 1;
    s->picture.top_field_first  = 0;

    /* One dv_decode_video_segment() job per work chunk of the profile. */
    s->buf = buf;
    avctx->execute(avctx, dv_decode_video_segment, s->sys->work_chunks, NULL,
                   dv_work_pool_size(s->sys), sizeof(DVwork_chunk));

    emms_c();

    /* return image */
    *data_size = sizeof(AVFrame);
    *out       = s->picture;

    return s->sys->frame_size;
}
#endif /* CONFIG_DVVIDEO_DECODER */
| 723 | 1170 |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1171 |
| 8051 | 1172 static inline int dv_write_pack(enum dv_pack_type pack_id, DVVideoContext *c, |
| 1173 uint8_t* buf) | |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1174 { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1175 /* |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1176 * Here's what SMPTE314M says about these two: |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1177 * (page 6) APTn, AP1n, AP2n, AP3n: These data shall be identical |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1178 * as track application IDs (APTn = 001, AP1n = |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1179 * 001, AP2n = 001, AP3n = 001), if the source signal |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1180 * comes from a digital VCR. If the signal source is |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1181 * unknown, all bits for these data shall be set to 1. |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1182 * (page 12) STYPE: STYPE defines a signal type of video signal |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1183 * 00000b = 4:1:1 compression |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1184 * 00100b = 4:2:2 compression |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1185 * XXXXXX = Reserved |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1186 * Now, I've got two problems with these statements: |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1187 * 1. it looks like APT == 111b should be a safe bet, but it isn't. |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1188 * It seems that for PAL as defined in IEC 61834 we have to set |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1189 * APT to 000 and for SMPTE314M to 001. |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1190 * 2. It is not at all clear what STYPE is used for 4:2:0 PAL |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1191 * compression scheme (if any). |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1192 */ |
| 8051 | 1193 int apt = (c->sys->pix_fmt == PIX_FMT_YUV420P ? 0 : 1); |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1194 int stype = (c->sys->pix_fmt == PIX_FMT_YUV422P ? 4 : 0); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1195 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1196 uint8_t aspect = 0; |
| 8051 | 1197 if ((int)(av_q2d(c->avctx->sample_aspect_ratio) * c->avctx->width / c->avctx->height * 10) == 17) /* 16:9 */ |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1198 aspect = 0x02; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1199 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1200 buf[0] = (uint8_t)pack_id; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1201 switch (pack_id) { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1202 case dv_header525: /* I can't imagine why these two weren't defined as real */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1203 case dv_header625: /* packs in SMPTE314M -- they definitely look like ones */ |
| 8051 | 1204 buf[1] = 0xf8 | /* reserved -- always 1 */ |
| 1205 (apt & 0x07); /* APT: Track application ID */ | |
| 1206 buf[2] = (0 << 7) | /* TF1: audio data is 0 - valid; 1 - invalid */ | |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1207 (0x0f << 3) | /* reserved -- always 1 */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1208 (apt & 0x07); /* AP1: Audio application ID */ |
| 8051 | 1209 buf[3] = (0 << 7) | /* TF2: video data is 0 - valid; 1 - invalid */ |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1210 (0x0f << 3) | /* reserved -- always 1 */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1211 (apt & 0x07); /* AP2: Video application ID */ |
| 8051 | 1212 buf[4] = (0 << 7) | /* TF3: subcode(SSYB) is 0 - valid; 1 - invalid */ |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1213 (0x0f << 3) | /* reserved -- always 1 */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1214 (apt & 0x07); /* AP3: Subcode application ID */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1215 break; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1216 case dv_video_source: |
| 8051 | 1217 buf[1] = 0xff; /* reserved -- always 1 */ |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1218 buf[2] = (1 << 7) | /* B/W: 0 - b/w, 1 - color */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1219 (1 << 6) | /* following CLF is valid - 0, invalid - 1 */ |
| 8050 | 1220 (3 << 4) | /* CLF: color frames ID (see ITU-R BT.470-4) */ |
| 8051 | 1221 0xf; /* reserved -- always 1 */ |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1222 buf[3] = (3 << 6) | /* reserved -- always 1 */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1223 (c->sys->dsf << 5) | /* system: 60fields/50fields */ |
| 8051 | 1224 stype; /* signal type video compression */ |
| 1225 buf[4] = 0xff; /* VISC: 0xff -- no information */ | |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1226 break; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1227 case dv_video_control: |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1228 buf[1] = (0 << 6) | /* Copy generation management (CGMS) 0 -- free */ |
| 8051 | 1229 0x3f; /* reserved -- always 1 */ |
| 1230 buf[2] = 0xc8 | /* reserved -- always b11001xxx */ | |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1231 aspect; |
| 8050 | 1232 buf[3] = (1 << 7) | /* frame/field flag 1 -- frame, 0 -- field */ |
| 1233 (1 << 6) | /* first/second field flag 0 -- field 2, 1 -- field 1 */ | |
| 1234 (1 << 5) | /* frame change flag 0 -- same picture as before, 1 -- different */ | |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1235 (1 << 4) | /* 1 - interlaced, 0 - noninterlaced */ |
| 8051 | 1236 0xc; /* reserved -- always b1100 */ |
| 1237 buf[4] = 0xff; /* reserved -- always 1 */ | |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1238 break; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1239 default: |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1240 buf[1] = buf[2] = buf[3] = buf[4] = 0xff; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1241 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1242 return 5; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1243 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1244 |
|
7240
2552555c8a92
Move #ifdef CONFIG_DVVIDEO_ENCODER up to cover all functions used for encoding.
diego
parents:
7239
diff
changeset
|
1245 #ifdef CONFIG_DVVIDEO_ENCODER |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1246 static void dv_format_frame(DVVideoContext* c, uint8_t* buf) |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1247 { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1248 int chan, i, j, k; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1249 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1250 for (chan = 0; chan < c->sys->n_difchan; chan++) { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1251 for (i = 0; i < c->sys->difseg_size; i++) { |
| 8050 | 1252 memset(buf, 0xff, 80 * 6); /* first 6 DIF blocks are for control data */ |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1253 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1254 /* DV header: 1DIF */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1255 buf += dv_write_dif_id(dv_sect_header, chan, i, 0, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1256 buf += dv_write_pack((c->sys->dsf ? dv_header625 : dv_header525), c, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1257 buf += 72; /* unused bytes */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1258 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1259 /* DV subcode: 2DIFs */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1260 for (j = 0; j < 2; j++) { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1261 buf += dv_write_dif_id(dv_sect_subcode, chan, i, j, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1262 for (k = 0; k < 6; k++) |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1263 buf += dv_write_ssyb_id(k, (i < c->sys->difseg_size/2), buf) + 5; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1264 buf += 29; /* unused bytes */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1265 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1266 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1267 /* DV VAUX: 3DIFS */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1268 for (j = 0; j < 3; j++) { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1269 buf += dv_write_dif_id(dv_sect_vaux, chan, i, j, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1270 buf += dv_write_pack(dv_video_source, c, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1271 buf += dv_write_pack(dv_video_control, c, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1272 buf += 7*5; |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1273 buf += dv_write_pack(dv_video_source, c, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1274 buf += dv_write_pack(dv_video_control, c, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1275 buf += 4*5 + 2; /* unused bytes */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1276 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1277 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1278 /* DV Audio/Video: 135 Video DIFs + 9 Audio DIFs */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1279 for (j = 0; j < 135; j++) { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1280 if (j%15 == 0) { |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1281 memset(buf, 0xff, 80); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1282 buf += dv_write_dif_id(dv_sect_audio, chan, i, j/15, buf); |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1283 buf += 77; /* audio control & shuffled PCM audio */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1284 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1285 buf += dv_write_dif_id(dv_sect_video, chan, i, j, buf); |
| 7980 | 1286 buf += 77; /* 1 video macroblock: 1 bytes control |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1287 4 * 14 bytes Y 8x8 data |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1288 10 bytes Cr 8x8 data |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1289 10 bytes Cb 8x8 data */ |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1290 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1291 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1292 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1293 } |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1294 |
|
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1295 |
| 2967 | 1296 static int dvvideo_encode_frame(AVCodecContext *c, uint8_t *buf, int buf_size, |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1297 void *data) |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1298 { |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1299 DVVideoContext *s = c->priv_data; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1300 |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1301 s->sys = dv_codec_profile(c); |
|
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
1302 if (!s->sys || buf_size < s->sys->frame_size || dv_init_dynamic_tables(s->sys)) |
| 2422 | 1303 return -1; |
| 1304 | |
| 8051 | 1305 c->pix_fmt = s->sys->pix_fmt; |
| 1306 s->picture = *((AVFrame *)data); | |
|
2822
fdedaa2e6da4
DV video encoder/decoder doesn't set keyframe and picture type properties patch by (Edward Hervey:bilboed,gmail com)
michael
parents:
2661
diff
changeset
|
1307 s->picture.key_frame = 1; |
|
fdedaa2e6da4
DV video encoder/decoder doesn't set keyframe and picture type properties patch by (Edward Hervey:bilboed,gmail com)
michael
parents:
2661
diff
changeset
|
1308 s->picture.pict_type = FF_I_TYPE; |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1309 |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1310 s->buf = buf; |
| 8163 | 1311 c->execute(c, dv_encode_video_segment, s->sys->work_chunks, NULL, |
| 8131 | 1312 dv_work_pool_size(s->sys), sizeof(DVwork_chunk)); |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1313 |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1314 emms_c(); |
| 3167 | 1315 |
|
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1316 dv_format_frame(s, buf); |
| 3167 | 1317 |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1318 return s->sys->frame_size; |
|
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1319 } |
| 3806 | 1320 #endif |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1321 |
|
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1322 static int dvvideo_close(AVCodecContext *c) |
|
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1323 { |
|
4352
0ee71c12734e
* Fixing a bug with incorrect bits set in AAUX source pack
romansh
parents:
4283
diff
changeset
|
1324 DVVideoContext *s = c->priv_data; |
|
0ee71c12734e
* Fixing a bug with incorrect bits set in AAUX source pack
romansh
parents:
4283
diff
changeset
|
1325 |
| 8051 | 1326 if (s->picture.data[0]) |
|
4352
0ee71c12734e
* Fixing a bug with incorrect bits set in AAUX source pack
romansh
parents:
4283
diff
changeset
|
1327 c->release_buffer(c, &s->picture); |
|
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1328 |
|
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1329 return 0; |
|
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1330 } |
|
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1331 |
|
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1332 |
|
2661
b2846918585c
a few #ifdef CONFIG_X_ENCODER, patch by (Roine Gustafsson <roine users.sourceforge net]
michael
parents:
2614
diff
changeset
|
1333 #ifdef CONFIG_DVVIDEO_ENCODER |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1334 AVCodec dvvideo_encoder = { |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1335 "dvvideo", |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1336 CODEC_TYPE_VIDEO, |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1337 CODEC_ID_DVVIDEO, |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1338 sizeof(DVVideoContext), |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1339 dvvideo_init, |
|
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1340 dvvideo_encode_frame, |
| 8051 | 1341 .pix_fmts = (enum PixelFormat[]) {PIX_FMT_YUV411P, PIX_FMT_YUV422P, PIX_FMT_YUV420P, PIX_FMT_NONE}, |
|
7040
e943e1409077
Make AVCodec long_names definition conditional depending on CONFIG_SMALL.
stefano
parents:
7039
diff
changeset
|
1342 .long_name = NULL_IF_CONFIG_SMALL("DV (Digital Video)"), |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1343 }; |
|
2661
b2846918585c
a few #ifdef CONFIG_X_ENCODER, patch by (Roine Gustafsson <roine users.sourceforge net]
michael
parents:
2614
diff
changeset
|
1344 #endif // CONFIG_DVVIDEO_ENCODER |
| 723 | 1345 |
| 3777 | 1346 #ifdef CONFIG_DVVIDEO_DECODER |
| 723 | 1347 AVCodec dvvideo_decoder = { |
| 1348 "dvvideo", | |
| 1349 CODEC_TYPE_VIDEO, | |
| 1350 CODEC_ID_DVVIDEO, | |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1351 sizeof(DVVideoContext), |
|
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1352 dvvideo_init, |
|
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1353 NULL, |
|
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1354 dvvideo_close, |
| 723 | 1355 dvvideo_decode_frame, |
| 835 | 1356 CODEC_CAP_DR1, |
| 6717 | 1357 NULL, |
|
7040
e943e1409077
Make AVCodec long_names definition conditional depending on CONFIG_SMALL.
stefano
parents:
7039
diff
changeset
|
1358 .long_name = NULL_IF_CONFIG_SMALL("DV (Digital Video)"), |
| 723 | 1359 }; |
| 3777 | 1360 #endif |
