Mercurial > libavcodec.hg
annotate msmpeg4.c @ 214:73df666cacc7 libavcodec
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
| author | nickols_k |
|---|---|
| date | Sun, 20 Jan 2002 14:48:02 +0000 |
| parents | 2eb04d6be309 |
| children | fe243b4aec02 |
| rev | line source |
|---|---|
| 0 | 1 /* |
| 2 * MSMPEG4 backend for ffmpeg encoder and decoder | |
| 3 * Copyright (c) 2001 Gerard Lantau. | |
| 4 * | |
| 5 * This program is free software; you can redistribute it and/or modify | |
| 6 * it under the terms of the GNU General Public License as published by | |
| 7 * the Free Software Foundation; either version 2 of the License, or | |
| 8 * (at your option) any later version. | |
| 9 * | |
| 10 * This program is distributed in the hope that it will be useful, | |
| 11 * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
| 12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
| 13 * GNU General Public License for more details. | |
| 14 * | |
| 15 * You should have received a copy of the GNU General Public License | |
| 16 * along with this program; if not, write to the Free Software | |
| 17 * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA. | |
| 18 */ | |
| 19 #include <stdlib.h> | |
| 20 #include <stdio.h> | |
| 21 #include "common.h" | |
| 22 #include "dsputil.h" | |
| 23 #include "mpegvideo.h" | |
| 24 | |
| 25 /* | |
| 26 * You can also call this codec : MPEG4 with a twist ! | |
| 27 * | |
| 28 * TODO: | |
| 29 * - (encoding) select best mv table (two choices) | |
| 30 * - (encoding) select best vlc/dc table | |
| 31 * - (decoding) handle slice indication | |
| 32 */ | |
| 33 //#define DEBUG | |
| 34 | |
| 35 /* motion vector table */ | |
| 36 typedef struct MVTable { | |
| 37 int n; | |
| 38 const UINT16 *table_mv_code; | |
| 39 const UINT8 *table_mv_bits; | |
| 40 const UINT8 *table_mvx; | |
| 41 const UINT8 *table_mvy; | |
| 42 UINT16 *table_mv_index; /* encoding: convert mv to index in table_mv */ | |
| 43 VLC vlc; /* decoding: vlc */ | |
| 44 } MVTable; | |
| 45 | |
| 46 static void msmpeg4_encode_block(MpegEncContext * s, DCTELEM * block, int n); | |
| 47 static int msmpeg4_decode_block(MpegEncContext * s, DCTELEM * block, | |
| 48 int n, int coded); | |
| 49 static int msmpeg4_decode_dc(MpegEncContext * s, int n, int *dir_ptr); | |
| 50 static int msmpeg4_decode_motion(MpegEncContext * s, | |
| 51 int *mx_ptr, int *my_ptr); | |
| 52 | |
| 53 #ifdef DEBUG | |
| 54 int intra_count = 0; | |
| 55 int frame_count = 0; | |
| 56 #endif | |
| 57 /* XXX: move it to mpegvideo.h */ | |
| 58 | |
| 59 static int init_done = 0; | |
| 60 | |
| 61 #include "msmpeg4data.h" | |
| 62 | |
| 63 #ifdef STATS | |
| 64 | |
| 65 const char *st_names[ST_NB] = { | |
| 66 "unknown", | |
| 67 "dc", | |
| 68 "intra_ac", | |
| 69 "inter_ac", | |
| 70 "intra_mb", | |
| 71 "inter_mb", | |
| 72 "mv", | |
| 73 }; | |
| 74 | |
| 75 int st_current_index = 0; | |
| 76 unsigned int st_bit_counts[ST_NB]; | |
| 77 unsigned int st_out_bit_counts[ST_NB]; | |
| 78 | |
| 79 #define set_stat(var) st_current_index = var; | |
| 80 | |
| 81 void print_stats(void) | |
| 82 { | |
| 83 unsigned int total; | |
| 84 int i; | |
| 85 | |
| 86 printf("Input:\n"); | |
| 87 total = 0; | |
| 88 for(i=0;i<ST_NB;i++) | |
| 89 total += st_bit_counts[i]; | |
| 90 if (total == 0) | |
| 91 total = 1; | |
| 92 for(i=0;i<ST_NB;i++) { | |
| 93 printf("%-10s : %10.1f %5.1f%%\n", | |
| 94 st_names[i], | |
| 95 (double)st_bit_counts[i] / 8.0, | |
| 96 (double)st_bit_counts[i] * 100.0 / total); | |
| 97 } | |
| 98 printf("%-10s : %10.1f %5.1f%%\n", | |
| 99 "total", | |
| 100 (double)total / 8.0, | |
| 101 100.0); | |
| 102 | |
| 103 printf("Output:\n"); | |
| 104 total = 0; | |
| 105 for(i=0;i<ST_NB;i++) | |
| 106 total += st_out_bit_counts[i]; | |
| 107 if (total == 0) | |
| 108 total = 1; | |
| 109 for(i=0;i<ST_NB;i++) { | |
| 110 printf("%-10s : %10.1f %5.1f%%\n", | |
| 111 st_names[i], | |
| 112 (double)st_out_bit_counts[i] / 8.0, | |
| 113 (double)st_out_bit_counts[i] * 100.0 / total); | |
| 114 } | |
| 115 printf("%-10s : %10.1f %5.1f%%\n", | |
| 116 "total", | |
| 117 (double)total / 8.0, | |
| 118 100.0); | |
| 119 } | |
| 120 | |
| 121 #else | |
| 122 | |
| 123 #define set_stat(var) | |
| 124 | |
| 125 #endif | |
| 126 | |
| 127 /* build the table which associate a (x,y) motion vector to a vlc */ | |
| 128 static void init_mv_table(MVTable *tab) | |
| 129 { | |
| 130 int i, x, y; | |
| 131 | |
| 132 tab->table_mv_index = malloc(sizeof(UINT16) * 4096); | |
| 133 /* mark all entries as not used */ | |
| 134 for(i=0;i<4096;i++) | |
| 135 tab->table_mv_index[i] = tab->n; | |
| 136 | |
| 137 for(i=0;i<tab->n;i++) { | |
| 138 x = tab->table_mvx[i]; | |
| 139 y = tab->table_mvy[i]; | |
| 140 tab->table_mv_index[(x << 6) | y] = i; | |
| 141 } | |
| 142 } | |
| 143 | |
| 144 static void code012(PutBitContext *pb, int n) | |
| 145 { | |
| 146 if (n == 0) { | |
| 147 put_bits(pb, 1, 0); | |
| 148 } else { | |
| 149 put_bits(pb, 1, 1); | |
| 150 put_bits(pb, 1, (n >= 2)); | |
| 151 } | |
| 152 } | |
| 153 | |
| 154 /* write MSMPEG4 V3 compatible frame header */ | |
| 155 void msmpeg4_encode_picture_header(MpegEncContext * s, int picture_number) | |
| 156 { | |
| 157 int i; | |
| 158 | |
| 159 align_put_bits(&s->pb); | |
| 160 | |
| 161 put_bits(&s->pb, 2, s->pict_type - 1); | |
| 162 | |
| 163 put_bits(&s->pb, 5, s->qscale); | |
| 164 | |
| 165 s->rl_table_index = 2; | |
| 166 s->rl_chroma_table_index = 1; /* only for I frame */ | |
| 167 s->dc_table_index = 1; | |
| 168 s->mv_table_index = 1; /* only if P frame */ | |
| 169 s->use_skip_mb_code = 1; /* only if P frame */ | |
| 170 | |
| 171 if (s->pict_type == I_TYPE) { | |
| 172 put_bits(&s->pb, 5, 0x17); /* indicate only one "slice" */ | |
| 173 | |
| 174 code012(&s->pb, s->rl_chroma_table_index); | |
| 175 code012(&s->pb, s->rl_table_index); | |
| 176 | |
| 177 put_bits(&s->pb, 1, s->dc_table_index); | |
| 178 s->no_rounding = 1; | |
| 179 } else { | |
| 180 put_bits(&s->pb, 1, s->use_skip_mb_code); | |
| 181 | |
| 182 s->rl_chroma_table_index = s->rl_table_index; | |
| 183 code012(&s->pb, s->rl_table_index); | |
| 184 | |
| 185 put_bits(&s->pb, 1, s->dc_table_index); | |
| 186 | |
| 187 put_bits(&s->pb, 1, s->mv_table_index); | |
| 208 | 188 |
| 189 if(s->flipflop_rounding){ | |
| 190 s->no_rounding ^= 1; | |
| 191 }else{ | |
| 192 s->no_rounding = 0; | |
| 193 } | |
| 0 | 194 } |
| 195 | |
| 196 if (!init_done) { | |
| 197 /* init various encoding tables */ | |
| 198 init_done = 1; | |
| 199 init_mv_table(&mv_tables[0]); | |
| 200 init_mv_table(&mv_tables[1]); | |
| 201 for(i=0;i<NB_RL_TABLES;i++) | |
| 202 init_rl(&rl_table[i]); | |
| 203 } | |
| 204 | |
| 205 #ifdef DEBUG | |
| 206 intra_count = 0; | |
| 207 printf("*****frame %d:\n", frame_count++); | |
| 208 #endif | |
| 209 } | |
| 210 | |
| 208 | 211 void msmpeg4_encode_ext_header(MpegEncContext * s) |
| 212 { | |
| 213 if(s->pict_type == P_TYPE) | |
| 214 { | |
| 215 return; // P-Frames dont seem to have them and not even a 0 bit | |
| 216 } | |
| 217 else | |
| 218 { | |
| 219 s->flipflop_rounding=1; | |
| 220 s->bitrate= 910; | |
| 221 | |
| 222 put_bits(&s->pb, 1, 1); // ext header indicator | |
| 223 | |
| 224 put_bits(&s->pb, 4, 7); // ? | |
| 225 | |
| 226 put_bits(&s->pb, 11, s->bitrate); | |
| 227 | |
| 228 put_bits(&s->pb, 1, s->flipflop_rounding); | |
| 229 } | |
| 230 } | |
| 231 | |
| 0 | 232 /* predict coded block */ |
| 233 static inline int coded_block_pred(MpegEncContext * s, int n, UINT8 **coded_block_ptr) | |
| 234 { | |
| 235 int x, y, wrap, pred, a, b, c; | |
| 236 | |
| 237 x = 2 * s->mb_x + 1 + (n & 1); | |
| 238 y = 2 * s->mb_y + 1 + ((n & 2) >> 1); | |
| 239 wrap = s->mb_width * 2 + 2; | |
| 240 | |
| 241 /* B C | |
| 242 * A X | |
| 243 */ | |
| 244 a = s->coded_block[(x - 1) + (y) * wrap]; | |
| 245 b = s->coded_block[(x - 1) + (y - 1) * wrap]; | |
| 246 c = s->coded_block[(x) + (y - 1) * wrap]; | |
| 247 | |
| 248 if (b == c) { | |
| 249 pred = a; | |
| 250 } else { | |
| 251 pred = c; | |
| 252 } | |
| 253 | |
| 254 /* store value */ | |
| 255 *coded_block_ptr = &s->coded_block[(x) + (y) * wrap]; | |
| 256 | |
| 257 return pred; | |
| 258 } | |
| 259 | |
| 260 static void msmpeg4_encode_motion(MpegEncContext * s, | |
| 261 int mx, int my) | |
| 262 { | |
| 263 int code; | |
| 264 MVTable *mv; | |
| 265 | |
| 266 /* modulo encoding */ | |
| 267 /* WARNING : you cannot reach all the MVs even with the modulo | |
| 268 encoding. This is a somewhat strange compromise they took !!! */ | |
| 269 if (mx <= -64) | |
| 270 mx += 64; | |
| 271 else if (mx >= 64) | |
| 272 mx -= 64; | |
| 273 if (my <= -64) | |
| 274 my += 64; | |
| 275 else if (my >= 64) | |
| 276 my -= 64; | |
| 277 | |
| 278 mx += 32; | |
| 279 my += 32; | |
| 280 #if 0 | |
| 281 if ((unsigned)mx >= 64 || | |
| 282 (unsigned)my >= 64) | |
| 283 fprintf(stderr, "error mx=%d my=%d\n", mx, my); | |
| 284 #endif | |
| 285 mv = &mv_tables[s->mv_table_index]; | |
| 286 | |
| 287 code = mv->table_mv_index[(mx << 6) | my]; | |
| 288 set_stat(ST_MV); | |
| 289 put_bits(&s->pb, | |
| 290 mv->table_mv_bits[code], | |
| 291 mv->table_mv_code[code]); | |
| 292 if (code == mv->n) { | |
| 293 /* escape : code litterally */ | |
| 294 put_bits(&s->pb, 6, mx); | |
| 295 put_bits(&s->pb, 6, my); | |
| 296 } | |
| 297 } | |
| 298 | |
| 299 void msmpeg4_encode_mb(MpegEncContext * s, | |
| 300 DCTELEM block[6][64], | |
| 301 int motion_x, int motion_y) | |
| 302 { | |
| 303 int cbp, coded_cbp, i; | |
| 304 int pred_x, pred_y; | |
| 305 UINT8 *coded_block; | |
| 306 | |
| 307 if (!s->mb_intra) { | |
| 308 /* compute cbp */ | |
| 309 set_stat(ST_INTER_MB); | |
| 310 cbp = 0; | |
| 311 for (i = 0; i < 6; i++) { | |
| 312 if (s->block_last_index[i] >= 0) | |
| 313 cbp |= 1 << (5 - i); | |
| 314 } | |
| 315 if (s->use_skip_mb_code && (cbp | motion_x | motion_y) == 0) { | |
| 316 /* skip macroblock */ | |
| 317 put_bits(&s->pb, 1, 1); | |
| 318 return; | |
| 319 } | |
| 320 if (s->use_skip_mb_code) | |
| 321 put_bits(&s->pb, 1, 0); /* mb coded */ | |
| 322 | |
| 323 put_bits(&s->pb, | |
| 324 table_mb_non_intra[cbp + 64][1], | |
| 325 table_mb_non_intra[cbp + 64][0]); | |
| 326 | |
| 327 /* motion vector */ | |
| 328 h263_pred_motion(s, 0, &pred_x, &pred_y); | |
| 329 msmpeg4_encode_motion(s, motion_x - pred_x, | |
| 330 motion_y - pred_y); | |
| 331 } else { | |
| 332 /* compute cbp */ | |
| 333 cbp = 0; | |
| 334 coded_cbp = 0; | |
| 335 for (i = 0; i < 6; i++) { | |
| 336 int val, pred; | |
| 337 val = (s->block_last_index[i] >= 1); | |
| 338 cbp |= val << (5 - i); | |
| 339 if (i < 4) { | |
| 340 /* predict value for close blocks only for luma */ | |
| 341 pred = coded_block_pred(s, i, &coded_block); | |
| 342 *coded_block = val; | |
| 343 val = val ^ pred; | |
| 344 } | |
| 345 coded_cbp |= val << (5 - i); | |
| 346 } | |
| 347 #if 0 | |
| 348 if (coded_cbp) | |
| 349 printf("cbp=%x %x\n", cbp, coded_cbp); | |
| 350 #endif | |
| 351 | |
| 352 if (s->pict_type == I_TYPE) { | |
| 353 set_stat(ST_INTRA_MB); | |
| 354 put_bits(&s->pb, | |
| 355 table_mb_intra[coded_cbp][1], table_mb_intra[coded_cbp][0]); | |
| 356 } else { | |
| 357 if (s->use_skip_mb_code) | |
| 358 put_bits(&s->pb, 1, 0); /* mb coded */ | |
| 359 put_bits(&s->pb, | |
| 360 table_mb_non_intra[cbp][1], | |
| 361 table_mb_non_intra[cbp][0]); | |
| 362 } | |
| 363 set_stat(ST_INTRA_MB); | |
| 364 put_bits(&s->pb, 1, 0); /* no AC prediction yet */ | |
| 365 } | |
| 366 | |
| 367 for (i = 0; i < 6; i++) { | |
| 368 msmpeg4_encode_block(s, block[i], i); | |
| 369 } | |
| 370 } | |
| 371 | |
| 372 | |
| 373 /* strongly inspirated from MPEG4, but not exactly the same ! */ | |
| 374 void msmpeg4_dc_scale(MpegEncContext * s) | |
| 375 { | |
|
195
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
376 if (s->qscale < 5){ |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
377 s->y_dc_scale = 8; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
378 s->c_dc_scale = 8; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
379 // s->c_dc_scale = (s->qscale + 13)>>1; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
380 }else if (s->qscale < 9){ |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
381 s->y_dc_scale = 2 * s->qscale; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
382 s->c_dc_scale = (s->qscale + 13)>>1; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
383 }else{ |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
384 s->y_dc_scale = s->qscale + 8; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
385 s->c_dc_scale = (s->qscale + 13)>>1; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
386 } |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
387 // this differs for quant >24 from mpeg4 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
388 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
389 // if(s->qscale==13) s->c_dc_scale=14; |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
390 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
391 // if(s->qscale>=6) |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
392 // printf("%d", s->qscale); |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
393 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
394 /* s->c_dc_scale values (found by Michael Nidermayer) |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
395 qscale=2 -> 8 (yes iam sure about that) |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
396 qscale=3 -> 8 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
397 qscale=4 -> 8 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
398 qscale=5 -> 9 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
399 qscale=6 -> 9 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
400 qscale=7 -> 10 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
401 qscale=8 -> 10 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
402 qscale=9 -> 11 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
403 qscale=10-> 11 |
|
92f726205082
s->c_dc_scale was 7 if s->qscale==2 but should be 8 (the bug is visible in deep red areas in high bitrate clips) - patch by Michael Niedermayer <michaelni@gmx.at>
arpi_esp
parents:
186
diff
changeset
|
404 */ |
| 0 | 405 } |
| 406 | |
| 407 /* dir = 0: left, dir = 1: top prediction */ | |
| 408 static int msmpeg4_pred_dc(MpegEncContext * s, int n, | |
| 25 | 409 INT16 **dc_val_ptr, int *dir_ptr) |
| 0 | 410 { |
| 411 int a, b, c, x, y, wrap, pred, scale; | |
| 25 | 412 INT16 *dc_val; |
| 0 | 413 |
| 414 /* find prediction */ | |
| 415 if (n < 4) { | |
| 416 x = 2 * s->mb_x + 1 + (n & 1); | |
| 417 y = 2 * s->mb_y + 1 + ((n & 2) >> 1); | |
| 418 wrap = s->mb_width * 2 + 2; | |
| 419 dc_val = s->dc_val[0]; | |
| 420 scale = s->y_dc_scale; | |
| 421 } else { | |
| 422 x = s->mb_x + 1; | |
| 423 y = s->mb_y + 1; | |
| 424 wrap = s->mb_width + 2; | |
| 425 dc_val = s->dc_val[n - 4 + 1]; | |
| 426 scale = s->c_dc_scale; | |
| 427 } | |
| 428 | |
| 429 /* B C | |
| 430 * A X | |
| 431 */ | |
| 432 a = dc_val[(x - 1) + (y) * wrap]; | |
| 433 b = dc_val[(x - 1) + (y - 1) * wrap]; | |
| 434 c = dc_val[(x) + (y - 1) * wrap]; | |
| 435 | |
| 436 /* XXX: the following solution consumes divisions, but it does not | |
| 437 necessitate to modify mpegvideo.c. The problem comes from the | |
| 438 fact they decided to store the quantized DC (which would lead | |
| 439 to problems if Q could vary !) */ | |
| 204 | 440 #ifdef ARCH_X86 |
| 441 /* using 16bit divisions as they are large enough and 2x as fast */ | |
| 442 asm volatile( | |
| 443 "movl %3, %%eax \n\t" | |
| 444 "shrl $1, %%eax \n\t" | |
| 445 "addl %%eax, %2 \n\t" | |
| 446 "addl %%eax, %1 \n\t" | |
| 447 "addl %0, %%eax \n\t" | |
| 448 "xorl %%edx, %%edx \n\t" | |
| 449 "divw %w3 \n\t" | |
| 450 "movzwl %%ax, %0 \n\t" | |
| 451 "movl %1, %%eax \n\t" | |
| 452 "xorl %%edx, %%edx \n\t" | |
| 453 "divw %w3 \n\t" | |
| 454 "movzwl %%ax, %1 \n\t" | |
| 455 "movl %2, %%eax \n\t" | |
| 456 "xorl %%edx, %%edx \n\t" | |
| 457 "divw %w3 \n\t" | |
| 458 "movzwl %%ax, %2 \n\t" | |
| 459 : "+r" (a), "+r" (b), "+r" (c) | |
| 460 : "r" (scale) | |
| 461 : "%eax", "%edx" | |
| 462 ); | |
|
214
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
463 #elif defined (ARCH_ALPHA) |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
464 /* Divisions are extremely costly on Alpha; optimize the most |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
465 common case. */ |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
466 if (scale == 8) { |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
467 a = (a + (8 >> 1)) / 8; |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
468 b = (b + (8 >> 1)) / 8; |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
469 c = (c + (8 >> 1)) / 8; |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
470 } else { |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
471 a = (a + (scale >> 1)) / scale; |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
472 b = (b + (scale >> 1)) / scale; |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
473 c = (c + (scale >> 1)) / scale; |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
474 } |
|
73df666cacc7
Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents:
208
diff
changeset
|
475 #else |
| 0 | 476 a = (a + (scale >> 1)) / scale; |
| 477 b = (b + (scale >> 1)) / scale; | |
| 478 c = (c + (scale >> 1)) / scale; | |
| 204 | 479 #endif |
| 0 | 480 /* XXX: WARNING: they did not choose the same test as MPEG4. This |
| 481 is very important ! */ | |
| 482 if (abs(a - b) <= abs(b - c)) { | |
| 483 pred = c; | |
| 484 *dir_ptr = 1; | |
| 485 } else { | |
| 486 pred = a; | |
| 487 *dir_ptr = 0; | |
| 488 } | |
| 489 | |
| 490 /* update predictor */ | |
| 491 *dc_val_ptr = &dc_val[(x) + (y) * wrap]; | |
| 492 return pred; | |
| 493 } | |
| 494 | |
| 495 #define DC_MAX 119 | |
| 496 | |
| 497 static void msmpeg4_encode_dc(MpegEncContext * s, int level, int n, int *dir_ptr) | |
| 498 { | |
| 499 int sign, code; | |
| 500 int pred; | |
| 25 | 501 INT16 *dc_val; |
| 0 | 502 |
| 503 pred = msmpeg4_pred_dc(s, n, &dc_val, dir_ptr); | |
| 504 | |
| 505 /* update predictor */ | |
| 506 if (n < 4) { | |
| 507 *dc_val = level * s->y_dc_scale; | |
| 508 } else { | |
| 509 *dc_val = level * s->c_dc_scale; | |
| 510 } | |
| 511 | |
| 512 /* do the prediction */ | |
| 513 level -= pred; | |
| 514 | |
| 515 sign = 0; | |
| 516 if (level < 0) { | |
| 517 level = -level; | |
| 518 sign = 1; | |
| 519 } | |
| 520 | |
| 521 code = level; | |
| 522 if (code > DC_MAX) | |
| 523 code = DC_MAX; | |
| 524 | |
| 525 if (s->dc_table_index == 0) { | |
| 526 if (n < 4) { | |
| 527 put_bits(&s->pb, table0_dc_lum[code][1], table0_dc_lum[code][0]); | |
| 528 } else { | |
| 529 put_bits(&s->pb, table0_dc_chroma[code][1], table0_dc_chroma[code][0]); | |
| 530 } | |
| 531 } else { | |
| 532 if (n < 4) { | |
| 533 put_bits(&s->pb, table1_dc_lum[code][1], table1_dc_lum[code][0]); | |
| 534 } else { | |
| 535 put_bits(&s->pb, table1_dc_chroma[code][1], table1_dc_chroma[code][0]); | |
| 536 } | |
| 537 } | |
| 538 | |
| 539 if (code == DC_MAX) | |
| 540 put_bits(&s->pb, 8, level); | |
| 541 | |
| 542 if (level != 0) { | |
| 543 put_bits(&s->pb, 1, sign); | |
| 544 } | |
| 545 } | |
| 546 | |
| 547 /* Encoding of a block. Very similar to MPEG4 except for a different | |
| 548 escape coding (same as H263) and more vlc tables. | |
| 549 */ | |
| 550 static void msmpeg4_encode_block(MpegEncContext * s, DCTELEM * block, int n) | |
| 551 { | |
| 552 int level, run, last, i, j, last_index; | |
| 553 int last_non_zero, sign, slevel; | |
| 554 int code, run_diff, dc_pred_dir; | |
| 555 const RLTable *rl; | |
| 556 | |
| 557 if (s->mb_intra) { | |
| 558 set_stat(ST_DC); | |
| 559 msmpeg4_encode_dc(s, block[0], n, &dc_pred_dir); | |
| 560 i = 1; | |
| 561 if (n < 4) { | |
| 562 rl = &rl_table[s->rl_table_index]; | |
| 563 } else { | |
| 564 rl = &rl_table[3 + s->rl_chroma_table_index]; | |
| 565 } | |
| 566 run_diff = 0; | |
| 567 set_stat(ST_INTRA_AC); | |
| 568 } else { | |
| 569 i = 0; | |
| 570 rl = &rl_table[3 + s->rl_table_index]; | |
| 571 run_diff = 1; | |
| 572 set_stat(ST_INTER_AC); | |
| 573 } | |
| 574 | |
| 575 /* AC coefs */ | |
| 576 last_index = s->block_last_index[n]; | |
| 577 last_non_zero = i - 1; | |
| 578 for (; i <= last_index; i++) { | |
| 579 j = zigzag_direct[i]; | |
| 580 level = block[j]; | |
| 581 if (level) { | |
| 582 run = i - last_non_zero - 1; | |
| 583 last = (i == last_index); | |
| 584 sign = 0; | |
| 585 slevel = level; | |
| 586 if (level < 0) { | |
| 587 sign = 1; | |
| 588 level = -level; | |
| 589 } | |
| 590 code = get_rl_index(rl, last, run, level); | |
| 591 put_bits(&s->pb, rl->table_vlc[code][1], rl->table_vlc[code][0]); | |
| 592 if (code == rl->n) { | |
| 593 int level1, run1; | |
| 594 | |
| 595 level1 = level - rl->max_level[last][run]; | |
| 596 if (level1 < 1) | |
| 597 goto esc2; | |
| 598 code = get_rl_index(rl, last, run, level1); | |
| 599 if (code == rl->n) { | |
| 600 esc2: | |
| 601 put_bits(&s->pb, 1, 0); | |
| 602 if (level > MAX_LEVEL) | |
| 603 goto esc3; | |
| 604 run1 = run - rl->max_run[last][level] - run_diff; | |
| 605 if (run1 < 0) | |
| 606 goto esc3; | |
| 607 code = get_rl_index(rl, last, run1, level); | |
| 608 if (code == rl->n) { | |
| 609 esc3: | |
| 610 /* third escape */ | |
| 611 put_bits(&s->pb, 1, 0); | |
| 612 put_bits(&s->pb, 1, last); | |
| 613 put_bits(&s->pb, 6, run); | |
| 614 put_bits(&s->pb, 8, slevel & 0xff); | |
| 615 } else { | |
| 616 /* second escape */ | |
| 617 put_bits(&s->pb, 1, 1); | |
| 618 put_bits(&s->pb, rl->table_vlc[code][1], rl->table_vlc[code][0]); | |
| 619 put_bits(&s->pb, 1, sign); | |
| 620 } | |
| 621 } else { | |
| 622 /* first escape */ | |
| 623 put_bits(&s->pb, 1, 1); | |
| 624 put_bits(&s->pb, rl->table_vlc[code][1], rl->table_vlc[code][0]); | |
| 625 put_bits(&s->pb, 1, sign); | |
| 626 } | |
| 627 } else { | |
| 628 put_bits(&s->pb, 1, sign); | |
| 629 } | |
| 630 last_non_zero = i; | |
| 631 } | |
| 632 } | |
| 633 } | |
| 634 | |
| 635 /****************************************/ | |
| 636 /* decoding stuff */ | |
| 637 | |
| 638 static VLC mb_non_intra_vlc; | |
| 639 static VLC mb_intra_vlc; | |
| 640 static VLC dc_lum_vlc[2]; | |
| 641 static VLC dc_chroma_vlc[2]; | |
| 642 | |
| 643 /* init all vlc decoding tables */ | |
| 644 int msmpeg4_decode_init_vlc(MpegEncContext *s) | |
| 645 { | |
| 646 int i; | |
| 647 MVTable *mv; | |
| 648 | |
| 649 for(i=0;i<NB_RL_TABLES;i++) { | |
| 650 init_rl(&rl_table[i]); | |
| 651 init_vlc_rl(&rl_table[i]); | |
| 652 } | |
| 653 for(i=0;i<2;i++) { | |
| 654 mv = &mv_tables[i]; | |
| 655 init_vlc(&mv->vlc, 9, mv->n + 1, | |
| 656 mv->table_mv_bits, 1, 1, | |
| 657 mv->table_mv_code, 2, 2); | |
| 658 } | |
| 659 | |
| 660 init_vlc(&dc_lum_vlc[0], 9, 120, | |
| 661 &table0_dc_lum[0][1], 8, 4, | |
| 662 &table0_dc_lum[0][0], 8, 4); | |
| 663 init_vlc(&dc_chroma_vlc[0], 9, 120, | |
| 664 &table0_dc_chroma[0][1], 8, 4, | |
| 665 &table0_dc_chroma[0][0], 8, 4); | |
| 666 init_vlc(&dc_lum_vlc[1], 9, 120, | |
| 667 &table1_dc_lum[0][1], 8, 4, | |
| 668 &table1_dc_lum[0][0], 8, 4); | |
| 669 init_vlc(&dc_chroma_vlc[1], 9, 120, | |
| 670 &table1_dc_chroma[0][1], 8, 4, | |
| 671 &table1_dc_chroma[0][0], 8, 4); | |
| 672 | |
| 673 init_vlc(&mb_non_intra_vlc, 9, 128, | |
| 674 &table_mb_non_intra[0][1], 8, 4, | |
| 675 &table_mb_non_intra[0][0], 8, 4); | |
| 48 | 676 init_vlc(&mb_intra_vlc, 9, 64, |
| 0 | 677 &table_mb_intra[0][1], 4, 2, |
| 678 &table_mb_intra[0][0], 4, 2); | |
| 679 return 0; | |
| 680 } | |
| 681 | |
| 682 static int decode012(GetBitContext *gb) | |
| 683 { | |
| 684 int n; | |
| 21 | 685 n = get_bits1(gb); |
| 0 | 686 if (n == 0) |
| 687 return 0; | |
| 688 else | |
| 21 | 689 return get_bits1(gb) + 1; |
| 0 | 690 } |
| 691 | |
| 692 int msmpeg4_decode_picture_header(MpegEncContext * s) | |
| 693 { | |
| 694 int code; | |
| 695 | |
| 696 s->pict_type = get_bits(&s->gb, 2) + 1; | |
| 697 if (s->pict_type != I_TYPE && | |
| 698 s->pict_type != P_TYPE) | |
| 699 return -1; | |
| 700 | |
| 701 s->qscale = get_bits(&s->gb, 5); | |
| 702 | |
| 703 if (s->pict_type == I_TYPE) { | |
| 704 code = get_bits(&s->gb, 5); | |
| 705 /* 0x17: one slice, 0x18: three slices */ | |
| 706 /* XXX: implement it */ | |
| 200 | 707 //printf("%d %d %d\n", code, s->slice_height, s->first_slice_line); |
| 0 | 708 if (code < 0x17) |
| 709 return -1; | |
| 710 s->slice_height = s->mb_height / (code - 0x16); | |
| 711 s->rl_chroma_table_index = decode012(&s->gb); | |
| 712 s->rl_table_index = decode012(&s->gb); | |
| 713 | |
| 21 | 714 s->dc_table_index = get_bits1(&s->gb); |
| 0 | 715 s->no_rounding = 1; |
| 200 | 716 /* printf(" %d %d %d %d \n", |
| 717 s->qscale, | |
| 718 s->rl_chroma_table_index, | |
| 719 s->rl_table_index, | |
| 720 s->dc_table_index);*/ | |
| 0 | 721 } else { |
| 21 | 722 s->use_skip_mb_code = get_bits1(&s->gb); |
| 0 | 723 |
| 724 s->rl_table_index = decode012(&s->gb); | |
| 725 s->rl_chroma_table_index = s->rl_table_index; | |
| 726 | |
| 21 | 727 s->dc_table_index = get_bits1(&s->gb); |
| 0 | 728 |
| 21 | 729 s->mv_table_index = get_bits1(&s->gb); |
| 200 | 730 /* printf(" %d %d %d %d %d \n", |
| 731 s->use_skip_mb_code, | |
| 732 s->rl_table_index, | |
| 733 s->rl_chroma_table_index, | |
| 734 s->dc_table_index, | |
| 735 s->mv_table_index);*/ | |
| 208 | 736 if(s->flipflop_rounding){ |
| 737 s->no_rounding ^= 1; | |
| 738 }else{ | |
| 739 s->no_rounding = 0; | |
| 740 } | |
| 741 // printf("%d", s->no_rounding); | |
| 0 | 742 } |
| 208 | 743 |
| 744 | |
| 0 | 745 #ifdef DEBUG |
| 746 printf("*****frame %d:\n", frame_count++); | |
| 747 #endif | |
| 748 return 0; | |
| 749 } | |
| 750 | |
| 208 | 751 int msmpeg4_decode_ext_header(MpegEncContext * s, int buf_size) |
| 752 { | |
| 753 int firstBit=0; | |
| 754 | |
| 755 /* the alt_bitstream reader could read over the end so we need to check it */ | |
| 756 if(get_bits_count(&s->gb) < buf_size*8) firstBit= get_bits1(&s->gb); | |
| 757 | |
| 758 if(s->pict_type == P_TYPE) | |
| 759 { | |
| 760 if(firstBit) return -1; // havnt seen ext headers in P-Frames yet ;) | |
| 761 } | |
| 762 else | |
| 763 { | |
| 764 int unk; | |
| 765 if(!firstBit) // no header found | |
| 766 { | |
| 767 s->flipflop_rounding= 0; | |
| 768 s->bitrate= 0; | |
| 769 return 0; | |
| 770 } | |
| 771 | |
| 772 unk= get_bits(&s->gb, 4); | |
| 773 s->bitrate= get_bits(&s->gb, 11); | |
| 774 | |
| 775 // printf("%2d %4d ;; %1X\n", unk,s->bitrate, unk); | |
| 776 | |
| 777 s->flipflop_rounding= get_bits1(&s->gb); | |
| 778 } | |
| 779 | |
| 780 return 0; | |
| 781 } | |
| 782 | |
| 0 | 783 void memsetw(short *tab, int val, int n) |
| 784 { | |
| 785 int i; | |
| 786 for(i=0;i<n;i++) | |
| 787 tab[i] = val; | |
| 788 } | |
| 789 | |
| 790 int msmpeg4_decode_mb(MpegEncContext *s, | |
| 791 DCTELEM block[6][64]) | |
| 792 { | |
| 793 int cbp, code, i; | |
| 794 int pred, val; | |
| 795 UINT8 *coded_val; | |
| 796 | |
| 797 /* special slice handling */ | |
| 798 if (s->mb_x == 0) { | |
| 122 | 799 if (s->slice_height && (s->mb_y % s->slice_height) == 0) { |
| 0 | 800 int wrap; |
| 801 /* reset DC pred (set previous line to 1024) */ | |
| 802 wrap = 2 * s->mb_width + 2; | |
| 803 memsetw(&s->dc_val[0][(1) + (2 * s->mb_y) * wrap], | |
| 804 1024, 2 * s->mb_width); | |
| 805 wrap = s->mb_width + 2; | |
| 806 memsetw(&s->dc_val[1][(1) + (s->mb_y) * wrap], | |
| 807 1024, s->mb_width); | |
| 808 memsetw(&s->dc_val[2][(1) + (s->mb_y) * wrap], | |
| 809 1024, s->mb_width); | |
|
186
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
810 |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
811 /* reset AC pred (set previous line to 0) */ |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
812 wrap = s->mb_width * 2 + 2; |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
813 memsetw(s->ac_val[0][0] + (1 + (2 * s->mb_y) * wrap)*16, |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
814 0, 2 * s->mb_width*16); |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
815 wrap = s->mb_width + 2; |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
816 memsetw(s->ac_val[1][0] + (1 + (s->mb_y) * wrap)*16, |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
817 0, s->mb_width*16); |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
818 memsetw(s->ac_val[2][0] + (1 + (s->mb_y) * wrap)*16, |
|
cf37da86d990
fix slices when code=0x18, patch by Michael Niedermayer <michael@mplayer.dev.hu>
arpi_esp
parents:
122
diff
changeset
|
819 0, s->mb_width*16); |
| 0 | 820 |
| 821 s->first_slice_line = 1; | |
| 822 } else { | |
| 823 s->first_slice_line = 0; | |
| 824 } | |
| 825 } | |
| 826 | |
| 827 if (s->pict_type == P_TYPE) { | |
| 828 set_stat(ST_INTER_MB); | |
| 829 if (s->use_skip_mb_code) { | |
| 21 | 830 if (get_bits1(&s->gb)) { |
| 0 | 831 /* skip mb */ |
| 832 s->mb_intra = 0; | |
| 833 for(i=0;i<6;i++) | |
| 834 s->block_last_index[i] = -1; | |
| 835 s->mv_dir = MV_DIR_FORWARD; | |
| 836 s->mv_type = MV_TYPE_16X16; | |
| 837 s->mv[0][0][0] = 0; | |
| 838 s->mv[0][0][1] = 0; | |
|
7
1d3ac9654178
added skip macroblock optimization (big perf win on black regions for example)
glantau
parents:
0
diff
changeset
|
839 s->mb_skiped = 1; |
| 0 | 840 return 0; |
| 841 } | |
| 842 } | |
| 843 | |
| 844 code = get_vlc(&s->gb, &mb_non_intra_vlc); | |
| 845 if (code < 0) | |
| 846 return -1; | |
| 847 if (code & 0x40) | |
| 848 s->mb_intra = 0; | |
| 849 else | |
| 850 s->mb_intra = 1; | |
| 851 | |
| 852 cbp = code & 0x3f; | |
| 853 } else { | |
| 854 set_stat(ST_INTRA_MB); | |
| 855 s->mb_intra = 1; | |
| 856 code = get_vlc(&s->gb, &mb_intra_vlc); | |
| 857 if (code < 0) | |
| 858 return -1; | |
| 859 /* predict coded block pattern */ | |
| 860 cbp = 0; | |
| 861 for(i=0;i<6;i++) { | |
| 862 val = ((code >> (5 - i)) & 1); | |
| 863 if (i < 4) { | |
| 864 pred = coded_block_pred(s, i, &coded_val); | |
| 865 val = val ^ pred; | |
| 866 *coded_val = val; | |
| 867 } | |
| 868 cbp |= val << (5 - i); | |
| 869 } | |
| 870 } | |
| 871 | |
| 872 if (!s->mb_intra) { | |
| 873 int mx, my; | |
| 874 set_stat(ST_MV); | |
| 875 h263_pred_motion(s, 0, &mx, &my); | |
| 876 if (msmpeg4_decode_motion(s, &mx, &my) < 0) | |
| 877 return -1; | |
| 878 s->mv_dir = MV_DIR_FORWARD; | |
| 879 s->mv_type = MV_TYPE_16X16; | |
| 880 s->mv[0][0][0] = mx; | |
| 881 s->mv[0][0][1] = my; | |
| 882 } else { | |
| 883 set_stat(ST_INTRA_MB); | |
| 21 | 884 s->ac_pred = get_bits1(&s->gb); |
| 0 | 885 } |
| 886 | |
| 887 for (i = 0; i < 6; i++) { | |
| 888 if (msmpeg4_decode_block(s, block[i], i, (cbp >> (5 - i)) & 1) < 0) | |
| 889 return -1; | |
| 890 } | |
| 891 return 0; | |
| 892 } | |
| 893 | |
| 894 static int msmpeg4_decode_block(MpegEncContext * s, DCTELEM * block, | |
| 895 int n, int coded) | |
| 896 { | |
| 897 int code, level, i, j, last, run, run_diff; | |
| 898 int dc_pred_dir; | |
| 899 RLTable *rl; | |
| 900 const UINT8 *scan_table; | |
| 200 | 901 int qmul, qadd; |
| 0 | 902 |
| 903 if (s->mb_intra) { | |
| 200 | 904 qmul=1; |
| 905 qadd=0; | |
| 906 | |
| 0 | 907 /* DC coef */ |
| 908 set_stat(ST_DC); | |
| 909 level = msmpeg4_decode_dc(s, n, &dc_pred_dir); | |
| 910 if (level < 0) | |
| 911 return -1; | |
| 912 block[0] = level; | |
| 913 if (n < 4) { | |
| 914 rl = &rl_table[s->rl_table_index]; | |
| 915 } else { | |
| 916 rl = &rl_table[3 + s->rl_chroma_table_index]; | |
| 917 } | |
| 200 | 918 |
| 0 | 919 run_diff = 0; |
| 920 i = 1; | |
| 921 if (!coded) { | |
| 922 goto not_coded; | |
| 923 } | |
| 924 if (s->ac_pred) { | |
| 925 if (dc_pred_dir == 0) | |
| 926 scan_table = ff_alternate_vertical_scan; /* left */ | |
| 927 else | |
| 928 scan_table = ff_alternate_horizontal_scan; /* top */ | |
| 929 } else { | |
| 930 scan_table = zigzag_direct; | |
| 931 } | |
| 932 set_stat(ST_INTRA_AC); | |
| 933 } else { | |
| 200 | 934 qmul = s->qscale << 1; |
| 935 qadd = (s->qscale - 1) | 1; | |
| 0 | 936 i = 0; |
| 937 rl = &rl_table[3 + s->rl_table_index]; | |
| 938 run_diff = 1; | |
| 939 if (!coded) { | |
| 940 s->block_last_index[n] = i - 1; | |
| 941 return 0; | |
| 942 } | |
| 943 scan_table = zigzag_direct; | |
| 944 set_stat(ST_INTER_AC); | |
| 945 } | |
| 946 | |
| 947 for(;;) { | |
| 948 code = get_vlc(&s->gb, &rl->vlc); | |
| 949 if (code < 0) | |
| 950 return -1; | |
| 951 if (code == rl->n) { | |
| 952 /* escape */ | |
| 21 | 953 if (get_bits1(&s->gb) == 0) { |
| 954 if (get_bits1(&s->gb) == 0) { | |
| 0 | 955 /* third escape */ |
| 21 | 956 last = get_bits1(&s->gb); |
| 0 | 957 run = get_bits(&s->gb, 6); |
| 958 level = get_bits(&s->gb, 8); | |
| 959 level = (level << 24) >> 24; /* sign extend */ | |
| 200 | 960 if(level>0) level= level * qmul + qadd; |
| 961 else level= level * qmul - qadd; | |
| 0 | 962 } else { |
| 963 /* second escape */ | |
| 964 code = get_vlc(&s->gb, &rl->vlc); | |
| 965 if (code < 0 || code >= rl->n) | |
| 966 return -1; | |
| 967 run = rl->table_run[code]; | |
| 201 | 968 level = rl->table_level[code]; |
| 0 | 969 last = code >= rl->last; |
| 970 run += rl->max_run[last][level] + run_diff; | |
| 201 | 971 level= level * qmul + qadd; |
| 21 | 972 if (get_bits1(&s->gb)) |
| 0 | 973 level = -level; |
| 974 } | |
| 975 } else { | |
| 976 /* first escape */ | |
| 977 code = get_vlc(&s->gb, &rl->vlc); | |
| 978 if (code < 0 || code >= rl->n) | |
| 979 return -1; | |
| 980 run = rl->table_run[code]; | |
| 981 level = rl->table_level[code]; | |
| 982 last = code >= rl->last; | |
| 983 level += rl->max_level[last][run]; | |
| 200 | 984 level= level * qmul + qadd; |
| 21 | 985 if (get_bits1(&s->gb)) |
| 0 | 986 level = -level; |
| 987 } | |
| 988 } else { | |
| 989 run = rl->table_run[code]; | |
| 200 | 990 level = rl->table_level[code] * qmul + qadd; |
| 0 | 991 last = code >= rl->last; |
| 21 | 992 if (get_bits1(&s->gb)) |
| 0 | 993 level = -level; |
| 994 } | |
| 995 i += run; | |
| 996 if (i >= 64) | |
| 997 return -1; | |
| 998 j = scan_table[i]; | |
| 999 block[j] = level; | |
| 1000 i++; | |
| 1001 if (last) | |
| 1002 break; | |
| 1003 } | |
| 1004 not_coded: | |
| 1005 if (s->mb_intra) { | |
| 1006 mpeg4_pred_ac(s, block, n, dc_pred_dir); | |
| 1007 if (s->ac_pred) { | |
| 1008 i = 64; /* XXX: not optimal */ | |
| 1009 } | |
| 1010 } | |
| 1011 s->block_last_index[n] = i - 1; | |
| 1012 | |
| 1013 return 0; | |
| 1014 } | |
| 1015 | |
| 1016 static int msmpeg4_decode_dc(MpegEncContext * s, int n, int *dir_ptr) | |
| 1017 { | |
| 1018 int level, pred; | |
| 25 | 1019 INT16 *dc_val; |
| 0 | 1020 |
| 1021 if (n < 4) { | |
| 1022 level = get_vlc(&s->gb, &dc_lum_vlc[s->dc_table_index]); | |
| 1023 } else { | |
| 1024 level = get_vlc(&s->gb, &dc_chroma_vlc[s->dc_table_index]); | |
| 1025 } | |
| 1026 if (level < 0) | |
| 1027 return -1; | |
| 1028 | |
| 1029 if (level == DC_MAX) { | |
| 1030 level = get_bits(&s->gb, 8); | |
| 21 | 1031 if (get_bits1(&s->gb)) |
| 0 | 1032 level = -level; |
| 1033 } else if (level != 0) { | |
| 21 | 1034 if (get_bits1(&s->gb)) |
| 0 | 1035 level = -level; |
| 1036 } | |
| 1037 | |
| 1038 pred = msmpeg4_pred_dc(s, n, &dc_val, dir_ptr); | |
| 1039 level += pred; | |
| 1040 | |
| 1041 /* update predictor */ | |
| 1042 if (n < 4) { | |
| 1043 *dc_val = level * s->y_dc_scale; | |
| 1044 } else { | |
| 1045 *dc_val = level * s->c_dc_scale; | |
| 1046 } | |
| 1047 | |
| 1048 return level; | |
| 1049 } | |
| 1050 | |
| 1051 static int msmpeg4_decode_motion(MpegEncContext * s, | |
| 1052 int *mx_ptr, int *my_ptr) | |
| 1053 { | |
| 1054 MVTable *mv; | |
| 1055 int code, mx, my; | |
| 1056 | |
| 1057 mv = &mv_tables[s->mv_table_index]; | |
| 1058 | |
| 1059 code = get_vlc(&s->gb, &mv->vlc); | |
| 1060 if (code < 0) | |
| 1061 return -1; | |
| 1062 if (code == mv->n) { | |
| 1063 mx = get_bits(&s->gb, 6); | |
| 1064 my = get_bits(&s->gb, 6); | |
| 1065 } else { | |
| 1066 mx = mv->table_mvx[code]; | |
| 1067 my = mv->table_mvy[code]; | |
| 1068 } | |
| 1069 | |
| 1070 mx += *mx_ptr - 32; | |
| 1071 my += *my_ptr - 32; | |
| 1072 /* WARNING : they do not do exactly modulo encoding */ | |
| 1073 if (mx <= -64) | |
| 1074 mx += 64; | |
| 1075 else if (mx >= 64) | |
| 1076 mx -= 64; | |
| 1077 | |
| 1078 if (my <= -64) | |
| 1079 my += 64; | |
| 1080 else if (my >= 64) | |
| 1081 my -= 64; | |
| 1082 *mx_ptr = mx; | |
| 1083 *my_ptr = my; | |
| 1084 return 0; | |
| 1085 } |
