Mercurial > libavcodec.hg
annotate mathops.h @ 10874:bcfe2acbf190 libavcodec
AAC: Compress codebook tables and optimise sign bit handling
The codebooks each consist of a small number of values repeated in
groups of 2 or 4. Storing the codebooks as a packed list of 2- or
4-bit indexes into a table reduces their size substantially (from 7.5k
to 1.5k), resulting in less cache pressure.
For the band types with sign bits in the bitstream, storing the number
and position of non-zero codebook values using a few bits avoids
multiple get_bits() calls and floating-point comparisons which gcc
handles miserably.
Some float/int type punning also avoids gcc brain damage.
Overall speedup 20-35% on Cortex-A8, 20% on Core i7.
| author | mru |
|---|---|
| date | Wed, 13 Jan 2010 16:46:28 +0000 |
| parents | 42a126c78744 |
| children | 38b3b209b4bc |
| rev | line source |
|---|---|
| 3733 | 1 /* |
| 2 * simple math operations | |
|
8629
04423b2f6e0b
cosmetics: Remove pointless period after copyright statement non-sentences.
diego
parents:
8627
diff
changeset
|
3 * Copyright (c) 2001, 2002 Fabrice Bellard |
| 3733 | 4 * Copyright (c) 2006 Michael Niedermayer <michaelni@gmx.at> et al |
| 5 * | |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3733
diff
changeset
|
6 * This file is part of FFmpeg. |
|
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3733
diff
changeset
|
7 * |
|
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3733
diff
changeset
|
8 * FFmpeg is free software; you can redistribute it and/or |
| 3733 | 9 * modify it under the terms of the GNU Lesser General Public |
| 10 * License as published by the Free Software Foundation; either | |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3733
diff
changeset
|
11 * version 2.1 of the License, or (at your option) any later version. |
| 3733 | 12 * |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3733
diff
changeset
|
13 * FFmpeg is distributed in the hope that it will be useful, |
| 3733 | 14 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
| 16 * Lesser General Public License for more details. | |
| 17 * | |
| 18 * You should have received a copy of the GNU Lesser General Public | |
|
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3733
diff
changeset
|
19 * License along with FFmpeg; if not, write to the Free Software |
| 3733 | 20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
| 21 */ | |
| 7760 | 22 #ifndef AVCODEC_MATHOPS_H |
| 23 #define AVCODEC_MATHOPS_H | |
| 3733 | 24 |
| 6763 | 25 #include "libavutil/common.h" |
| 5162 | 26 |
| 9679 | 27 #if ARCH_ARM |
| 9678 | 28 # include "arm/mathops.h" |
| 10065 | 29 #elif ARCH_AVR32 |
| 30 # include "avr32/mathops.h" | |
| 9679 | 31 #elif ARCH_BFIN |
| 32 # include "bfin/mathops.h" | |
| 9729 | 33 #elif ARCH_MIPS |
| 34 # include "mips/mathops.h" | |
| 8590 | 35 #elif ARCH_PPC |
| 9678 | 36 # include "ppc/mathops.h" |
| 9679 | 37 #elif ARCH_X86 |
| 38 # include "x86/mathops.h" | |
| 3733 | 39 #endif |
| 40 | |
| 41 /* generic implementation */ | |
| 42 | |
| 43 #ifndef MULL | |
| 8201 | 44 # define MULL(a,b,s) (((int64_t)(a) * (int64_t)(b)) >> (s)) |
| 3733 | 45 #endif |
| 46 | |
| 47 #ifndef MULH | |
| 48 //gcc 3.4 creates an incredibly bloated mess out of this | |
| 49 //# define MULH(a,b) (((int64_t)(a) * (int64_t)(b))>>32) | |
| 50 | |
|
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4112
diff
changeset
|
51 static av_always_inline int MULH(int a, int b){ |
| 3733 | 52 return ((int64_t)(a) * (int64_t)(b))>>32; |
| 53 } | |
| 54 #endif | |
| 55 | |
| 56 #ifndef MUL64 | |
| 57 # define MUL64(a,b) ((int64_t)(a) * (int64_t)(b)) | |
| 58 #endif | |
| 59 | |
| 7255 | 60 #ifndef MAC64 |
| 61 # define MAC64(d, a, b) ((d) += MUL64(a, b)) | |
| 62 #endif | |
| 63 | |
| 64 #ifndef MLS64 | |
| 65 # define MLS64(d, a, b) ((d) -= MUL64(a, b)) | |
| 66 #endif | |
| 67 | |
| 3733 | 68 /* signed 16x16 -> 32 multiply add accumulate */ |
| 69 #ifndef MAC16 | |
| 70 # define MAC16(rt, ra, rb) rt += (ra) * (rb) | |
| 71 #endif | |
| 72 | |
| 73 /* signed 16x16 -> 32 multiply */ | |
| 74 #ifndef MUL16 | |
| 75 # define MUL16(ra, rb) ((ra) * (rb)) | |
| 76 #endif | |
| 77 | |
| 7255 | 78 #ifndef MLS16 |
| 79 # define MLS16(rt, ra, rb) ((rt) -= (ra) * (rb)) | |
| 80 #endif | |
| 81 | |
|
8627
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
82 /* median of 3 */ |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
83 #ifndef mid_pred |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
84 #define mid_pred mid_pred |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
85 static inline av_const int mid_pred(int a, int b, int c) |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
86 { |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
87 #if 0 |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
88 int t= (a-b)&((a-b)>>31); |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
89 a-=t; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
90 b+=t; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
91 b-= (b-c)&((b-c)>>31); |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
92 b+= (a-b)&((a-b)>>31); |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
93 |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
94 return b; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
95 #else |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
96 if(a>b){ |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
97 if(c>b){ |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
98 if(c>a) b=a; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
99 else b=c; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
100 } |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
101 }else{ |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
102 if(b>c){ |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
103 if(c>a) b=c; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
104 else b=a; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
105 } |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
106 } |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
107 return b; |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
108 #endif |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
109 } |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
110 #endif |
|
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8590
diff
changeset
|
111 |
| 9096 | 112 #ifndef sign_extend |
| 113 static inline av_const int sign_extend(int val, unsigned bits) | |
| 114 { | |
| 115 return (val << (INT_BIT - bits)) >> (INT_BIT - bits); | |
| 116 } | |
| 117 #endif | |
| 118 | |
| 7760 | 119 #endif /* AVCODEC_MATHOPS_H */ |
| 3733 | 120 |
