Mercurial > libavcodec.hg
annotate h264.h @ 11032:01bd040f8607 libavcodec
Unroll main loop so the edge==0 case is seperate.
This allows many things to be simplified away.
h264 decoder is overall 1% faster with a mbaff sample and
0.1% slower with the cathedral sample, probably because the slow loop
filter code must be loaded into the code cache for each first MB of each
row but isnt used for the following MBs.
| author | michael |
|---|---|
| date | Thu, 28 Jan 2010 01:24:25 +0000 |
| parents | b37a53d101c3 |
| children | 4aa724a692f5 |
| rev | line source |
|---|---|
| 4975 | 1 /* |
| 2 * H.26L/H.264/AVC/JVT/14496-10/... encoder/decoder | |
| 3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at> | |
| 4 * | |
| 5 * This file is part of FFmpeg. | |
| 6 * | |
| 7 * FFmpeg is free software; you can redistribute it and/or | |
| 8 * modify it under the terms of the GNU Lesser General Public | |
| 9 * License as published by the Free Software Foundation; either | |
| 10 * version 2.1 of the License, or (at your option) any later version. | |
| 11 * | |
| 12 * FFmpeg is distributed in the hope that it will be useful, | |
| 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
| 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
| 15 * Lesser General Public License for more details. | |
| 16 * | |
| 17 * You should have received a copy of the GNU Lesser General Public | |
| 18 * License along with FFmpeg; if not, write to the Free Software | |
| 19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | |
| 20 */ | |
| 21 | |
| 22 /** | |
|
8718
e9d9d946f213
Use full internal pathname in doxygen @file directives.
diego
parents:
8596
diff
changeset
|
23 * @file libavcodec/h264.h |
| 4975 | 24 * H.264 / AVC / MPEG4 part10 codec. |
| 25 * @author Michael Niedermayer <michaelni@gmx.at> | |
| 26 */ | |
| 27 | |
| 7760 | 28 #ifndef AVCODEC_H264_H |
| 29 #define AVCODEC_H264_H | |
| 4975 | 30 |
| 31 #include "dsputil.h" | |
| 32 #include "cabac.h" | |
| 33 #include "mpegvideo.h" | |
|
5638
4a26dc4ca11d
Move H.264 intra prediction functions into their own context
kostya
parents:
5231
diff
changeset
|
34 #include "h264pred.h" |
| 10866 | 35 #include "rectangle.h" |
| 4975 | 36 |
| 37 #define interlaced_dct interlaced_dct_is_a_bad_name | |
| 5129 | 38 #define mb_intra mb_intra_is_not_initialized_see_mb_type |
| 4975 | 39 |
| 40 #define LUMA_DC_BLOCK_INDEX 25 | |
| 41 #define CHROMA_DC_BLOCK_INDEX 26 | |
| 42 | |
| 43 #define CHROMA_DC_COEFF_TOKEN_VLC_BITS 8 | |
| 44 #define COEFF_TOKEN_VLC_BITS 8 | |
| 45 #define TOTAL_ZEROS_VLC_BITS 9 | |
| 46 #define CHROMA_DC_TOTAL_ZEROS_VLC_BITS 3 | |
| 47 #define RUN_VLC_BITS 3 | |
| 48 #define RUN7_VLC_BITS 6 | |
| 49 | |
| 50 #define MAX_SPS_COUNT 32 | |
| 51 #define MAX_PPS_COUNT 256 | |
| 52 | |
| 53 #define MAX_MMCO_COUNT 66 | |
| 54 | |
|
7283
39e81fdd8d23
Move the size of the H264Context delayed_pic array into a #define.
astrange
parents:
7178
diff
changeset
|
55 #define MAX_DELAYED_PIC_COUNT 16 |
|
39e81fdd8d23
Move the size of the H264Context delayed_pic array into a #define.
astrange
parents:
7178
diff
changeset
|
56 |
| 4975 | 57 /* Compiling in interlaced support reduces the speed |
| 58 * of progressive decoding by about 2%. */ | |
| 59 #define ALLOW_INTERLACE | |
| 60 | |
| 7407 | 61 #define ALLOW_NOCHROMA |
| 62 | |
|
8079
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
63 /** |
|
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
64 * The maximum number of slices supported by the decoder. |
|
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
65 * must be a power of 2 |
|
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
66 */ |
|
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
67 #define MAX_SLICES 16 |
|
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
68 |
| 4975 | 69 #ifdef ALLOW_INTERLACE |
| 70 #define MB_MBAFF h->mb_mbaff | |
| 71 #define MB_FIELD h->mb_field_decoding_flag | |
| 72 #define FRAME_MBAFF h->mb_aff_frame | |
| 5801 | 73 #define FIELD_PICTURE (s->picture_structure != PICT_FRAME) |
| 4975 | 74 #else |
| 75 #define MB_MBAFF 0 | |
| 76 #define MB_FIELD 0 | |
| 77 #define FRAME_MBAFF 0 | |
| 5767 | 78 #define FIELD_PICTURE 0 |
| 4975 | 79 #undef IS_INTERLACED |
| 80 #define IS_INTERLACED(mb_type) 0 | |
| 81 #endif | |
|
5781
0b3aa6f4c313
Modifies macroblock addressing and current macroblock y-position for field decoding.
andoma
parents:
5772
diff
changeset
|
82 #define FIELD_OR_MBAFF_PICTURE (FRAME_MBAFF || FIELD_PICTURE) |
| 4975 | 83 |
| 7407 | 84 #ifdef ALLOW_NOCHROMA |
| 85 #define CHROMA h->sps.chroma_format_idc | |
| 86 #else | |
| 87 #define CHROMA 1 | |
| 88 #endif | |
| 89 | |
|
10893
2aafcafbe1f0
Replace cabac checks in inline functions from h264.h with constants.
michael
parents:
10883
diff
changeset
|
90 #ifndef CABAC |
|
2aafcafbe1f0
Replace cabac checks in inline functions from h264.h with constants.
michael
parents:
10883
diff
changeset
|
91 #define CABAC h->pps.cabac |
|
2aafcafbe1f0
Replace cabac checks in inline functions from h264.h with constants.
michael
parents:
10883
diff
changeset
|
92 #endif |
|
2aafcafbe1f0
Replace cabac checks in inline functions from h264.h with constants.
michael
parents:
10883
diff
changeset
|
93 |
|
7988
a7dfe657968d
Move nal unit types enum and EXTENDED_SAR #define from h264data.h to h264.h.
michael
parents:
7906
diff
changeset
|
94 #define EXTENDED_SAR 255 |
|
a7dfe657968d
Move nal unit types enum and EXTENDED_SAR #define from h264data.h to h264.h.
michael
parents:
7906
diff
changeset
|
95 |
|
8207
2f35f9781c31
Move #defines that are mostly used in h264.c out of h264data.h and into h264.h.
diego
parents:
8107
diff
changeset
|
96 #define MB_TYPE_REF0 MB_TYPE_ACPRED //dirty but it fits in 16 bit |
|
2f35f9781c31
Move #defines that are mostly used in h264.c out of h264data.h and into h264.h.
diego
parents:
8107
diff
changeset
|
97 #define MB_TYPE_8x8DCT 0x01000000 |
|
2f35f9781c31
Move #defines that are mostly used in h264.c out of h264data.h and into h264.h.
diego
parents:
8107
diff
changeset
|
98 #define IS_REF0(a) ((a) & MB_TYPE_REF0) |
|
2f35f9781c31
Move #defines that are mostly used in h264.c out of h264data.h and into h264.h.
diego
parents:
8107
diff
changeset
|
99 #define IS_8x8DCT(a) ((a) & MB_TYPE_8x8DCT) |
|
2f35f9781c31
Move #defines that are mostly used in h264.c out of h264data.h and into h264.h.
diego
parents:
8107
diff
changeset
|
100 |
|
10862
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
101 /** |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
102 * Value of Picture.reference when Picture is not a reference picture, but |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
103 * is held for delayed output. |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
104 */ |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
105 #define DELAYED_PIC_REF 4 |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
106 |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
107 |
|
7988
a7dfe657968d
Move nal unit types enum and EXTENDED_SAR #define from h264data.h to h264.h.
michael
parents:
7906
diff
changeset
|
108 /* NAL unit types */ |
|
a7dfe657968d
Move nal unit types enum and EXTENDED_SAR #define from h264data.h to h264.h.
michael
parents:
7906
diff
changeset
|
109 enum { |
| 7990 | 110 NAL_SLICE=1, |
| 111 NAL_DPA, | |
| 112 NAL_DPB, | |
| 113 NAL_DPC, | |
| 114 NAL_IDR_SLICE, | |
| 115 NAL_SEI, | |
| 116 NAL_SPS, | |
| 117 NAL_PPS, | |
| 118 NAL_AUD, | |
| 119 NAL_END_SEQUENCE, | |
| 120 NAL_END_STREAM, | |
| 121 NAL_FILLER_DATA, | |
| 122 NAL_SPS_EXT, | |
| 123 NAL_AUXILIARY_SLICE=19 | |
|
7988
a7dfe657968d
Move nal unit types enum and EXTENDED_SAR #define from h264data.h to h264.h.
michael
parents:
7906
diff
changeset
|
124 }; |
|
a7dfe657968d
Move nal unit types enum and EXTENDED_SAR #define from h264data.h to h264.h.
michael
parents:
7906
diff
changeset
|
125 |
| 4975 | 126 /** |
|
8762
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
127 * SEI message types |
|
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
128 */ |
|
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
129 typedef enum { |
| 8972 | 130 SEI_BUFFERING_PERIOD = 0, ///< buffering period (H.264, D.1.1) |
|
8762
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
131 SEI_TYPE_PIC_TIMING = 1, ///< picture timing |
|
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
132 SEI_TYPE_USER_DATA_UNREGISTERED = 5, ///< unregistered user data |
|
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
133 SEI_TYPE_RECOVERY_POINT = 6 ///< recovery point (frame # to decoder sync) |
|
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
134 } SEI_Type; |
|
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
135 |
|
4f1567ce75c4
Replace hard-coded SEI type constants with symbolic names
superdump
parents:
8740
diff
changeset
|
136 /** |
|
8107
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
137 * pic_struct in picture timing SEI message |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
138 */ |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
139 typedef enum { |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
140 SEI_PIC_STRUCT_FRAME = 0, ///< 0: %frame |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
141 SEI_PIC_STRUCT_TOP_FIELD = 1, ///< 1: top field |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
142 SEI_PIC_STRUCT_BOTTOM_FIELD = 2, ///< 2: bottom field |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
143 SEI_PIC_STRUCT_TOP_BOTTOM = 3, ///< 3: top field, bottom field, in that order |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
144 SEI_PIC_STRUCT_BOTTOM_TOP = 4, ///< 4: bottom field, top field, in that order |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
145 SEI_PIC_STRUCT_TOP_BOTTOM_TOP = 5, ///< 5: top field, bottom field, top field repeated, in that order |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
146 SEI_PIC_STRUCT_BOTTOM_TOP_BOTTOM = 6, ///< 6: bottom field, top field, bottom field repeated, in that order |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
147 SEI_PIC_STRUCT_FRAME_DOUBLING = 7, ///< 7: %frame doubling |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
148 SEI_PIC_STRUCT_FRAME_TRIPLING = 8 ///< 8: %frame tripling |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
149 } SEI_PicStructType; |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
150 |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
151 /** |
| 4975 | 152 * Sequence parameter set |
| 153 */ | |
| 154 typedef struct SPS{ | |
| 155 | |
| 156 int profile_idc; | |
| 157 int level_idc; | |
| 7407 | 158 int chroma_format_idc; |
| 4975 | 159 int transform_bypass; ///< qpprime_y_zero_transform_bypass_flag |
| 160 int log2_max_frame_num; ///< log2_max_frame_num_minus4 + 4 | |
| 161 int poc_type; ///< pic_order_cnt_type | |
| 162 int log2_max_poc_lsb; ///< log2_max_pic_order_cnt_lsb_minus4 | |
| 163 int delta_pic_order_always_zero_flag; | |
| 164 int offset_for_non_ref_pic; | |
| 165 int offset_for_top_to_bottom_field; | |
| 166 int poc_cycle_length; ///< num_ref_frames_in_pic_order_cnt_cycle | |
| 167 int ref_frame_count; ///< num_ref_frames | |
| 168 int gaps_in_frame_num_allowed_flag; | |
|
5755
b45894d869da
Cosmetic preparations for h264/PAFF implementation.
andoma
parents:
5642
diff
changeset
|
169 int mb_width; ///< pic_width_in_mbs_minus1 + 1 |
|
b45894d869da
Cosmetic preparations for h264/PAFF implementation.
andoma
parents:
5642
diff
changeset
|
170 int mb_height; ///< pic_height_in_map_units_minus1 + 1 |
| 4975 | 171 int frame_mbs_only_flag; |
| 172 int mb_aff; ///<mb_adaptive_frame_field_flag | |
| 173 int direct_8x8_inference_flag; | |
| 174 int crop; ///< frame_cropping_flag | |
|
6582
7d40da88f0c7
Crop parameters are unsigned, having them negative could be bad and lead
michael
parents:
6488
diff
changeset
|
175 unsigned int crop_left; ///< frame_cropping_rect_left_offset |
|
7d40da88f0c7
Crop parameters are unsigned, having them negative could be bad and lead
michael
parents:
6488
diff
changeset
|
176 unsigned int crop_right; ///< frame_cropping_rect_right_offset |
|
7d40da88f0c7
Crop parameters are unsigned, having them negative could be bad and lead
michael
parents:
6488
diff
changeset
|
177 unsigned int crop_top; ///< frame_cropping_rect_top_offset |
|
7d40da88f0c7
Crop parameters are unsigned, having them negative could be bad and lead
michael
parents:
6488
diff
changeset
|
178 unsigned int crop_bottom; ///< frame_cropping_rect_bottom_offset |
| 4975 | 179 int vui_parameters_present_flag; |
| 180 AVRational sar; | |
|
10837
e5905bfa625d
Export fullrange flag and color information for h.264
conrad
parents:
10829
diff
changeset
|
181 int video_signal_type_present_flag; |
|
e5905bfa625d
Export fullrange flag and color information for h.264
conrad
parents:
10829
diff
changeset
|
182 int full_range; |
|
e5905bfa625d
Export fullrange flag and color information for h.264
conrad
parents:
10829
diff
changeset
|
183 int colour_description_present_flag; |
|
e5905bfa625d
Export fullrange flag and color information for h.264
conrad
parents:
10829
diff
changeset
|
184 enum AVColorPrimaries color_primaries; |
|
e5905bfa625d
Export fullrange flag and color information for h.264
conrad
parents:
10829
diff
changeset
|
185 enum AVColorTransferCharacteristic color_trc; |
|
e5905bfa625d
Export fullrange flag and color information for h.264
conrad
parents:
10829
diff
changeset
|
186 enum AVColorSpace colorspace; |
| 4975 | 187 int timing_info_present_flag; |
| 188 uint32_t num_units_in_tick; | |
| 189 uint32_t time_scale; | |
| 190 int fixed_frame_rate_flag; | |
| 191 short offset_for_ref_frame[256]; //FIXME dyn aloc? | |
| 192 int bitstream_restriction_flag; | |
| 193 int num_reorder_frames; | |
| 194 int scaling_matrix_present; | |
| 195 uint8_t scaling_matrix4[6][16]; | |
| 196 uint8_t scaling_matrix8[2][64]; | |
|
8107
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
197 int nal_hrd_parameters_present_flag; |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
198 int vcl_hrd_parameters_present_flag; |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
199 int pic_struct_present_flag; |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
200 int time_offset_length; |
| 8970 | 201 int cpb_cnt; ///< See H.264 E.1.2 |
| 8965 | 202 int initial_cpb_removal_delay_length; ///< initial_cpb_removal_delay_length_minus1 +1 |
|
8107
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
203 int cpb_removal_delay_length; ///< cpb_removal_delay_length_minus1 + 1 |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
204 int dpb_output_delay_length; ///< dpb_output_delay_length_minus1 + 1 |
|
8735
5d7ebbb7e91b
Add fields to H264Context and SPS for upcoming VA API support.
cehoyos
parents:
8718
diff
changeset
|
205 int bit_depth_luma; ///< bit_depth_luma_minus8 + 8 |
|
5d7ebbb7e91b
Add fields to H264Context and SPS for upcoming VA API support.
cehoyos
parents:
8718
diff
changeset
|
206 int bit_depth_chroma; ///< bit_depth_chroma_minus8 + 8 |
|
5d7ebbb7e91b
Add fields to H264Context and SPS for upcoming VA API support.
cehoyos
parents:
8718
diff
changeset
|
207 int residual_color_transform_flag; ///< residual_colour_transform_flag |
| 4975 | 208 }SPS; |
| 209 | |
| 210 /** | |
| 211 * Picture parameter set | |
| 212 */ | |
| 213 typedef struct PPS{ | |
| 214 unsigned int sps_id; | |
| 215 int cabac; ///< entropy_coding_mode_flag | |
| 216 int pic_order_present; ///< pic_order_present_flag | |
| 217 int slice_group_count; ///< num_slice_groups_minus1 + 1 | |
| 218 int mb_slice_group_map_type; | |
| 219 unsigned int ref_count[2]; ///< num_ref_idx_l0/1_active_minus1 + 1 | |
| 220 int weighted_pred; ///< weighted_pred_flag | |
| 221 int weighted_bipred_idc; | |
| 222 int init_qp; ///< pic_init_qp_minus26 + 26 | |
| 223 int init_qs; ///< pic_init_qs_minus26 + 26 | |
|
5231
07a97575d0c4
Add support for streams with different chroma_qp_index_offset
gpoirier
parents:
5226
diff
changeset
|
224 int chroma_qp_index_offset[2]; |
| 4975 | 225 int deblocking_filter_parameters_present; ///< deblocking_filter_parameters_present_flag |
| 226 int constrained_intra_pred; ///< constrained_intra_pred_flag | |
| 227 int redundant_pic_cnt_present; ///< redundant_pic_cnt_present_flag | |
| 228 int transform_8x8_mode; ///< transform_8x8_mode_flag | |
| 229 uint8_t scaling_matrix4[6][16]; | |
| 230 uint8_t scaling_matrix8[2][64]; | |
|
7347
612a78c3b128
qscale has a range of 0..51 we thus do not need a 256 entry table and neither need
michael
parents:
7343
diff
changeset
|
231 uint8_t chroma_qp_table[2][64]; ///< pre-scaled (with chroma_qp_index_offset) version of qp_table |
|
5231
07a97575d0c4
Add support for streams with different chroma_qp_index_offset
gpoirier
parents:
5226
diff
changeset
|
232 int chroma_qp_diff; |
| 4975 | 233 }PPS; |
| 234 | |
| 235 /** | |
| 236 * Memory management control operation opcode. | |
| 237 */ | |
| 238 typedef enum MMCOOpcode{ | |
| 239 MMCO_END=0, | |
| 240 MMCO_SHORT2UNUSED, | |
| 241 MMCO_LONG2UNUSED, | |
| 242 MMCO_SHORT2LONG, | |
| 243 MMCO_SET_MAX_LONG, | |
| 244 MMCO_RESET, | |
| 245 MMCO_LONG, | |
| 246 } MMCOOpcode; | |
| 247 | |
| 248 /** | |
| 249 * Memory management control operation. | |
| 250 */ | |
| 251 typedef struct MMCO{ | |
| 252 MMCOOpcode opcode; | |
|
5756
db5a041fd77c
Rename MMCO stuff to prepare for h264/PAFF implementation.
andoma
parents:
5755
diff
changeset
|
253 int short_pic_num; ///< pic_num without wrapping (pic_num & max_pic_num) |
|
db5a041fd77c
Rename MMCO stuff to prepare for h264/PAFF implementation.
andoma
parents:
5755
diff
changeset
|
254 int long_arg; ///< index, pic_num, or num long refs depending on opcode |
| 4975 | 255 } MMCO; |
| 256 | |
| 257 /** | |
| 258 * H264Context | |
| 259 */ | |
| 260 typedef struct H264Context{ | |
| 261 MpegEncContext s; | |
| 262 int nal_ref_idc; | |
| 263 int nal_unit_type; | |
| 5174 | 264 uint8_t *rbsp_buffer[2]; |
| 265 unsigned int rbsp_buffer_size[2]; | |
| 4975 | 266 |
| 267 /** | |
| 268 * Used to parse AVC variant of h264 | |
| 269 */ | |
| 270 int is_avc; ///< this flag is != 0 if codec is avc1 | |
| 271 int got_avcC; ///< flag used to parse avcC data only once | |
| 272 int nal_length_size; ///< Number of bytes used for nal length (1, 2 or 4) | |
| 273 | |
|
5231
07a97575d0c4
Add support for streams with different chroma_qp_index_offset
gpoirier
parents:
5226
diff
changeset
|
274 int chroma_qp[2]; //QPc |
| 4975 | 275 |
|
10896
f112b4d030fa
Avoid wasting 4 cpu cycles per MB in redundantly calculating qp_thresh.
michael
parents:
10893
diff
changeset
|
276 int qp_thresh; ///< QP threshold to skip loopfilter |
|
f112b4d030fa
Avoid wasting 4 cpu cycles per MB in redundantly calculating qp_thresh.
michael
parents:
10893
diff
changeset
|
277 |
| 4975 | 278 int prev_mb_skipped; |
| 279 int next_mb_skipped; | |
| 280 | |
| 281 //prediction stuff | |
| 282 int chroma_pred_mode; | |
| 283 int intra16x16_pred_mode; | |
| 284 | |
| 285 int top_mb_xy; | |
| 286 int left_mb_xy[2]; | |
| 287 | |
|
11012
b2fd83b26dd9
Set top & left types for deblock in fill_caches().
michael
parents:
11010
diff
changeset
|
288 int top_type; |
|
b2fd83b26dd9
Set top & left types for deblock in fill_caches().
michael
parents:
11010
diff
changeset
|
289 int left_type[2]; |
|
b2fd83b26dd9
Set top & left types for deblock in fill_caches().
michael
parents:
11010
diff
changeset
|
290 |
| 4975 | 291 int8_t intra4x4_pred_mode_cache[5*8]; |
| 292 int8_t (*intra4x4_pred_mode)[8]; | |
|
5638
4a26dc4ca11d
Move H.264 intra prediction functions into their own context
kostya
parents:
5231
diff
changeset
|
293 H264PredContext hpc; |
| 4975 | 294 unsigned int topleft_samples_available; |
| 295 unsigned int top_samples_available; | |
| 296 unsigned int topright_samples_available; | |
| 297 unsigned int left_samples_available; | |
| 298 uint8_t (*top_borders[2])[16+2*8]; | |
| 299 uint8_t left_border[2*(17+2*9)]; | |
| 300 | |
| 301 /** | |
| 302 * non zero coeff count cache. | |
| 303 * is 64 if not available. | |
| 304 */ | |
|
10961
34a65026fa06
Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents:
10934
diff
changeset
|
305 DECLARE_ALIGNED_8(uint8_t, non_zero_count_cache)[6*8]; |
|
10909
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
306 |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
307 /* |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
308 .UU.YYYY |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
309 .UU.YYYY |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
310 .vv.YYYY |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
311 .VV.YYYY |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
312 */ |
| 10906 | 313 uint8_t (*non_zero_count)[32]; |
| 4975 | 314 |
| 315 /** | |
| 316 * Motion vector cache. | |
| 317 */ | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
318 DECLARE_ALIGNED_16(int16_t, mv_cache)[2][5*8][2]; |
|
10961
34a65026fa06
Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents:
10934
diff
changeset
|
319 DECLARE_ALIGNED_8(int8_t, ref_cache)[2][5*8]; |
| 4975 | 320 #define LIST_NOT_USED -1 //FIXME rename? |
| 321 #define PART_NOT_AVAILABLE -2 | |
| 322 | |
| 323 /** | |
| 324 * is 1 if the specific list MV&references are set to 0,0,-2. | |
| 325 */ | |
| 326 int mv_cache_clean[2]; | |
| 327 | |
| 328 /** | |
| 329 * number of neighbors (top and/or left) that used 8x8 dct | |
| 330 */ | |
| 331 int neighbor_transform_size; | |
| 332 | |
| 333 /** | |
| 334 * block_offset[ 0..23] for frame macroblocks | |
| 335 * block_offset[24..47] for field macroblocks | |
| 336 */ | |
| 337 int block_offset[2*(16+8)]; | |
| 338 | |
| 339 uint32_t *mb2b_xy; //FIXME are these 4 a good idea? | |
| 340 uint32_t *mb2b8_xy; | |
| 341 int b_stride; //FIXME use s->b4_stride | |
| 342 int b8_stride; | |
| 343 | |
| 344 int mb_linesize; ///< may be equal to s->linesize or s->linesize*2, for mbaff | |
| 345 int mb_uvlinesize; | |
| 346 | |
| 347 int emu_edge_width; | |
| 348 int emu_edge_height; | |
| 349 | |
| 350 int halfpel_flag; | |
| 351 int thirdpel_flag; | |
| 352 | |
| 353 int unknown_svq3_flag; | |
| 354 int next_slice_index; | |
| 355 | |
| 5079 | 356 SPS *sps_buffers[MAX_SPS_COUNT]; |
| 4975 | 357 SPS sps; ///< current sps |
| 358 | |
| 5079 | 359 PPS *pps_buffers[MAX_PPS_COUNT]; |
| 4975 | 360 /** |
| 361 * current pps | |
| 362 */ | |
| 363 PPS pps; //FIXME move to Picture perhaps? (->no) do we need that? | |
| 364 | |
| 365 uint32_t dequant4_buffer[6][52][16]; | |
| 366 uint32_t dequant8_buffer[2][52][64]; | |
| 367 uint32_t (*dequant4_coeff[6])[16]; | |
| 368 uint32_t (*dequant8_coeff[2])[64]; | |
| 369 int dequant_coeff_pps; ///< reinit tables when pps changes | |
| 370 | |
| 371 int slice_num; | |
|
8079
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
372 uint16_t *slice_table_base; |
|
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
373 uint16_t *slice_table; ///< slice_table_base + 2*mb_stride + 1 |
| 4975 | 374 int slice_type; |
| 7338 | 375 int slice_type_nos; ///< S free slice type (SI/SP are remapped to I/P) |
| 4975 | 376 int slice_type_fixed; |
| 377 | |
| 378 //interlacing specific flags | |
| 379 int mb_aff_frame; | |
| 380 int mb_field_decoding_flag; | |
| 381 int mb_mbaff; ///< mb_aff_frame && mb_field_decoding_flag | |
| 382 | |
|
10961
34a65026fa06
Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents:
10934
diff
changeset
|
383 DECLARE_ALIGNED_8(uint16_t, sub_mb_type)[4]; |
| 4975 | 384 |
| 385 //POC stuff | |
| 386 int poc_lsb; | |
| 387 int poc_msb; | |
| 388 int delta_poc_bottom; | |
| 389 int delta_poc[2]; | |
| 390 int frame_num; | |
| 391 int prev_poc_msb; ///< poc_msb of the last reference pic for POC type 0 | |
| 392 int prev_poc_lsb; ///< poc_lsb of the last reference pic for POC type 0 | |
| 393 int frame_num_offset; ///< for POC type 2 | |
| 394 int prev_frame_num_offset; ///< for POC type 2 | |
| 395 int prev_frame_num; ///< frame_num of the last pic for POC type 1/2 | |
| 396 | |
| 397 /** | |
|
5772
65b71bd21a4d
Fix h->curr_pic_num for field pictures. Necessary for proper PAFF support.
andoma
parents:
5767
diff
changeset
|
398 * frame_num for frames or 2*frame_num+1 for field pics. |
| 4975 | 399 */ |
| 400 int curr_pic_num; | |
| 401 | |
| 402 /** | |
| 403 * max_frame_num or 2*max_frame_num for field pics. | |
| 404 */ | |
| 405 int max_pic_num; | |
| 406 | |
| 407 //Weighted pred stuff | |
| 408 int use_weight; | |
| 409 int use_weight_chroma; | |
| 410 int luma_log2_weight_denom; | |
| 411 int chroma_log2_weight_denom; | |
| 412 int luma_weight[2][48]; | |
| 413 int luma_offset[2][48]; | |
| 414 int chroma_weight[2][48][2]; | |
| 415 int chroma_offset[2][48][2]; | |
| 416 int implicit_weight[48][48]; | |
| 417 | |
| 418 //deblock | |
| 419 int deblocking_filter; ///< disable_deblocking_filter_idc with 1<->0 | |
| 420 int slice_alpha_c0_offset; | |
| 421 int slice_beta_offset; | |
| 422 | |
| 423 int redundant_pic_count; | |
| 424 | |
| 425 int direct_spatial_mv_pred; | |
| 426 int dist_scale_factor[16]; | |
|
7898
a33287a39a55
Make MBAFF temporal direct mode closer to the spec.
michael
parents:
7760
diff
changeset
|
427 int dist_scale_factor_field[2][32]; |
|
7906
5be944626072
Another try to fix temporal direct mode references.
michael
parents:
7898
diff
changeset
|
428 int map_col_to_list0[2][16+32]; |
|
5be944626072
Another try to fix temporal direct mode references.
michael
parents:
7898
diff
changeset
|
429 int map_col_to_list0_field[2][2][16+32]; |
| 4975 | 430 |
| 431 /** | |
| 432 * num_ref_idx_l0/1_active_minus1 + 1 | |
| 433 */ | |
| 434 unsigned int ref_count[2]; ///< counts frames or fields, depending on current mb mode | |
| 435 unsigned int list_count; | |
| 10906 | 436 uint8_t *list_counts; ///< Array of list_count per MB specifying the slice type |
| 4975 | 437 Picture *short_ref[32]; |
| 438 Picture *long_ref[32]; | |
|
5755
b45894d869da
Cosmetic preparations for h264/PAFF implementation.
andoma
parents:
5642
diff
changeset
|
439 Picture default_ref_list[2][32]; ///< base reference list for all slices of a coded picture |
|
b45894d869da
Cosmetic preparations for h264/PAFF implementation.
andoma
parents:
5642
diff
changeset
|
440 Picture ref_list[2][48]; /**< 0..15: frame refs, 16..47: mbaff field refs. |
|
b45894d869da
Cosmetic preparations for h264/PAFF implementation.
andoma
parents:
5642
diff
changeset
|
441 Reordered version of default_ref_list |
|
b45894d869da
Cosmetic preparations for h264/PAFF implementation.
andoma
parents:
5642
diff
changeset
|
442 according to picture reordering in slice header */ |
|
8079
2d3c7cd7d143
Replace literally hardcoded max slice number by named constant.
michael
parents:
8025
diff
changeset
|
443 int ref2frm[MAX_SLICES][2][64]; ///< reference to frame number lists, used in the loop filter, the first 2 are for -2,-1 |
|
7283
39e81fdd8d23
Move the size of the H264Context delayed_pic array into a #define.
astrange
parents:
7178
diff
changeset
|
444 Picture *delayed_pic[MAX_DELAYED_PIC_COUNT+2]; //FIXME size? |
|
7310
033d10927d45
Remove delayed_output_pic, I do not understand what this variable was good for.
michael
parents:
7283
diff
changeset
|
445 int outputed_poc; |
| 4975 | 446 |
| 447 /** | |
| 448 * memory management control operations buffer. | |
| 449 */ | |
| 450 MMCO mmco[MAX_MMCO_COUNT]; | |
| 451 int mmco_index; | |
| 452 | |
| 453 int long_ref_count; ///< number of actual long term references | |
| 454 int short_ref_count; ///< number of actual short term references | |
| 455 | |
| 456 //data partitioning | |
| 457 GetBitContext intra_gb; | |
| 458 GetBitContext inter_gb; | |
| 459 GetBitContext *intra_gb_ptr; | |
| 460 GetBitContext *inter_gb_ptr; | |
| 461 | |
|
10961
34a65026fa06
Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents:
10934
diff
changeset
|
462 DECLARE_ALIGNED_16(DCTELEM, mb)[16*24]; |
| 6488 | 463 DCTELEM mb_padding[256]; ///< as mb is addressed by scantable[i] and scantable is uint8_t we can either check that i is not too large or ensure that there is some unused stuff after mb |
| 4975 | 464 |
| 465 /** | |
| 466 * Cabac | |
| 467 */ | |
| 468 CABACContext cabac; | |
| 469 uint8_t cabac_state[460]; | |
| 470 int cabac_init_idc; | |
| 471 | |
| 472 /* 0x100 -> non null luma_dc, 0x80/0x40 -> non null chroma_dc (cb/cr), 0x?0 -> chroma_cbp(0,1,2), 0x0? luma_cbp */ | |
| 473 uint16_t *cbp_table; | |
| 474 int cbp; | |
| 475 int top_cbp; | |
| 476 int left_cbp; | |
| 477 /* chroma_pred_mode for i4x4 or i16x16, else 0 */ | |
| 478 uint8_t *chroma_pred_mode_table; | |
| 479 int last_qscale_diff; | |
| 480 int16_t (*mvd_table[2])[2]; | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
481 DECLARE_ALIGNED_16(int16_t, mvd_cache)[2][5*8][2]; |
| 4975 | 482 uint8_t *direct_table; |
| 483 uint8_t direct_cache[5*8]; | |
| 484 | |
| 485 uint8_t zigzag_scan[16]; | |
| 486 uint8_t zigzag_scan8x8[64]; | |
| 487 uint8_t zigzag_scan8x8_cavlc[64]; | |
| 488 uint8_t field_scan[16]; | |
| 489 uint8_t field_scan8x8[64]; | |
| 490 uint8_t field_scan8x8_cavlc[64]; | |
| 491 const uint8_t *zigzag_scan_q0; | |
| 492 const uint8_t *zigzag_scan8x8_q0; | |
| 493 const uint8_t *zigzag_scan8x8_cavlc_q0; | |
| 494 const uint8_t *field_scan_q0; | |
| 495 const uint8_t *field_scan8x8_q0; | |
| 496 const uint8_t *field_scan8x8_cavlc_q0; | |
| 497 | |
| 498 int x264_build; | |
| 5642 | 499 |
| 500 /** | |
| 501 * @defgroup multithreading Members for slice based multithreading | |
| 502 * @{ | |
| 503 */ | |
| 504 struct H264Context *thread_context[MAX_THREADS]; | |
| 505 | |
| 506 /** | |
| 507 * current slice number, used to initalize slice_num of each thread/context | |
| 508 */ | |
| 509 int current_slice; | |
| 510 | |
| 511 /** | |
| 512 * Max number of threads / contexts. | |
| 513 * This is equal to AVCodecContext.thread_count unless | |
| 514 * multithreaded decoding is impossible, in which case it is | |
| 515 * reduced to 1. | |
| 516 */ | |
| 517 int max_contexts; | |
| 518 | |
| 519 /** | |
| 520 * 1 if the single thread fallback warning has already been | |
| 521 * displayed, 0 otherwise. | |
| 522 */ | |
| 523 int single_decode_warning; | |
| 524 | |
| 525 int last_slice_type; | |
| 526 /** @} */ | |
| 527 | |
|
6783
df0893f4fd86
Store mb_xy in H264Context and only calculate it once per MB.
astrange
parents:
6582
diff
changeset
|
528 int mb_xy; |
|
df0893f4fd86
Store mb_xy in H264Context and only calculate it once per MB.
astrange
parents:
6582
diff
changeset
|
529 |
| 8025 | 530 uint32_t svq3_watermark_key; |
|
8107
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
531 |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
532 /** |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
533 * pic_struct in picture timing SEI message |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
534 */ |
|
e61f76efc9f3
h264: Implement decoding of picture timing SEI message.
andoma
parents:
8079
diff
changeset
|
535 SEI_PicStructType sei_pic_struct; |
|
8353
add1a0d65370
Do not recalculate constant part of is_complex for every MB.
michael
parents:
8207
diff
changeset
|
536 |
|
8783
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
537 /** |
|
9831
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
538 * Complement sei_pic_struct |
|
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
539 * SEI_PIC_STRUCT_TOP_BOTTOM and SEI_PIC_STRUCT_BOTTOM_TOP indicate interlaced frames. |
|
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
540 * However, soft telecined frames may have these values. |
|
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
541 * This is used in an attempt to flag soft telecine progressive. |
|
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
542 */ |
|
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
543 int prev_interlaced_frame; |
|
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
544 |
|
febe1855b64a
Add field prev_interlaced_frame to H264Context to be able to flag soft telecine
cehoyos
parents:
9384
diff
changeset
|
545 /** |
|
9128
793cf8c68c4f
Add support for ct_type to correctly detect interlaced flag
schreter
parents:
9071
diff
changeset
|
546 * Bit set of clock types for fields/frames in picture timing SEI message. |
|
793cf8c68c4f
Add support for ct_type to correctly detect interlaced flag
schreter
parents:
9071
diff
changeset
|
547 * For each found ct_type, appropriate bit is set (e.g., bit 1 for |
|
793cf8c68c4f
Add support for ct_type to correctly detect interlaced flag
schreter
parents:
9071
diff
changeset
|
548 * interlaced). |
|
793cf8c68c4f
Add support for ct_type to correctly detect interlaced flag
schreter
parents:
9071
diff
changeset
|
549 */ |
|
793cf8c68c4f
Add support for ct_type to correctly detect interlaced flag
schreter
parents:
9071
diff
changeset
|
550 int sei_ct_type; |
|
793cf8c68c4f
Add support for ct_type to correctly detect interlaced flag
schreter
parents:
9071
diff
changeset
|
551 |
|
793cf8c68c4f
Add support for ct_type to correctly detect interlaced flag
schreter
parents:
9071
diff
changeset
|
552 /** |
| 8966 | 553 * dpb_output_delay in picture timing SEI message, see H.264 C.2.2 |
| 554 */ | |
| 555 int sei_dpb_output_delay; | |
| 556 | |
| 557 /** | |
| 8967 | 558 * cpb_removal_delay in picture timing SEI message, see H.264 C.1.2 |
| 559 */ | |
| 560 int sei_cpb_removal_delay; | |
| 561 | |
| 562 /** | |
|
8783
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
563 * recovery_frame_cnt from SEI message |
|
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
564 * |
|
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
565 * Set to -1 if no recovery point SEI message found or to number of frames |
|
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
566 * before playback synchronizes. Frames having recovery point are key |
|
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
567 * frames. |
|
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
568 */ |
|
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
569 int sei_recovery_frame_cnt; |
|
e91ea98d868a
Add SEI recovery point frame counter to H264Context and use it when
cehoyos
parents:
8762
diff
changeset
|
570 |
|
8353
add1a0d65370
Do not recalculate constant part of is_complex for every MB.
michael
parents:
8207
diff
changeset
|
571 int is_complex; |
|
8735
5d7ebbb7e91b
Add fields to H264Context and SPS for upcoming VA API support.
cehoyos
parents:
8718
diff
changeset
|
572 |
|
5d7ebbb7e91b
Add fields to H264Context and SPS for upcoming VA API support.
cehoyos
parents:
8718
diff
changeset
|
573 int luma_weight_flag[2]; ///< 7.4.3.2 luma_weight_lX_flag |
|
5d7ebbb7e91b
Add fields to H264Context and SPS for upcoming VA API support.
cehoyos
parents:
8718
diff
changeset
|
574 int chroma_weight_flag[2]; ///< 7.4.3.2 chroma_weight_lX_flag |
| 8972 | 575 |
| 576 // Timestamp stuff | |
| 577 int sei_buffering_period_present; ///< Buffering period SEI flag | |
| 578 int initial_cpb_removal_delay[32]; ///< Initial timestamps for CPBs | |
| 4975 | 579 }H264Context; |
| 580 | |
|
10859
762e6bb0ba40
Split (picture|seq) parameter set decoding out of h264.c.
michael
parents:
10858
diff
changeset
|
581 |
|
762e6bb0ba40
Split (picture|seq) parameter set decoding out of h264.c.
michael
parents:
10858
diff
changeset
|
582 extern const uint8_t ff_h264_chroma_qp[52]; |
|
762e6bb0ba40
Split (picture|seq) parameter set decoding out of h264.c.
michael
parents:
10858
diff
changeset
|
583 |
| 11031 | 584 void ff_svq3_luma_dc_dequant_idct_c(DCTELEM *block, int qp); |
| 585 | |
| 586 void ff_svq3_add_idct_c(uint8_t *dst, DCTELEM *block, int stride, int qp, int dc); | |
|
10859
762e6bb0ba40
Split (picture|seq) parameter set decoding out of h264.c.
michael
parents:
10858
diff
changeset
|
587 |
|
8996
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
588 /** |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
589 * Decode SEI |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
590 */ |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
591 int ff_h264_decode_sei(H264Context *h); |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
592 |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
593 /** |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
594 * Decode SPS |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
595 */ |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
596 int ff_h264_decode_seq_parameter_set(H264Context *h); |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
597 |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
598 /** |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
599 * Decode PPS |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
600 */ |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
601 int ff_h264_decode_picture_parameter_set(H264Context *h, int bit_length); |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
602 |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
603 /** |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
604 * Decodes a network abstraction layer unit. |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
605 * @param consumed is the number of bytes used as input |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
606 * @param length is the length of the array |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
607 * @param dst_length is the number of decoded bytes FIXME here or a decode rbsp tailing? |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
608 * @returns decoded bytes, might be src+1 if no escapes |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
609 */ |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
610 const uint8_t *ff_h264_decode_nal(H264Context *h, const uint8_t *src, int *dst_length, int *consumed, int length); |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
611 |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
612 /** |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
613 * identifies the exact end of the bitstream |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
614 * @return the length of the trailing, or 0 if damaged |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
615 */ |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
616 int ff_h264_decode_rbsp_trailing(H264Context *h, const uint8_t *src); |
|
e65778184ded
Make the following H264 functions available to the parser:
cehoyos
parents:
8972
diff
changeset
|
617 |
|
9380
54e650136c87
Add a ff_h264_free_context function and call it from the H.264 parser.
reimar
parents:
9128
diff
changeset
|
618 /** |
|
54e650136c87
Add a ff_h264_free_context function and call it from the H.264 parser.
reimar
parents:
9128
diff
changeset
|
619 * frees any data that may have been allocated in the H264 context like SPS, PPS etc. |
|
54e650136c87
Add a ff_h264_free_context function and call it from the H.264 parser.
reimar
parents:
9128
diff
changeset
|
620 */ |
|
9384
828d15d322ed
Add forgotten void return type to ff_h264_free_context
reimar
parents:
9380
diff
changeset
|
621 av_cold void ff_h264_free_context(H264Context *h); |
|
9380
54e650136c87
Add a ff_h264_free_context function and call it from the H.264 parser.
reimar
parents:
9128
diff
changeset
|
622 |
|
10829
46a247e54d6e
Export get_slice_type() as ff_h264_get_slice_type().
ramiro
parents:
9831
diff
changeset
|
623 /** |
|
46a247e54d6e
Export get_slice_type() as ff_h264_get_slice_type().
ramiro
parents:
9831
diff
changeset
|
624 * reconstructs bitstream slice_type. |
|
46a247e54d6e
Export get_slice_type() as ff_h264_get_slice_type().
ramiro
parents:
9831
diff
changeset
|
625 */ |
|
10987
85de0c8a19b7
Added a missing const to ff_h264_get_slice_type().
fenrir
parents:
10985
diff
changeset
|
626 int ff_h264_get_slice_type(const H264Context *h); |
|
10829
46a247e54d6e
Export get_slice_type() as ff_h264_get_slice_type().
ramiro
parents:
9831
diff
changeset
|
627 |
| 10852 | 628 /** |
| 629 * allocates tables. | |
| 630 * needs width/height | |
| 631 */ | |
| 632 int ff_h264_alloc_tables(H264Context *h); | |
| 633 | |
| 634 /** | |
|
10862
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
635 * fills the default_ref_list. |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
636 */ |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
637 int ff_h264_fill_default_ref_list(H264Context *h); |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
638 |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
639 int ff_h264_decode_ref_pic_list_reordering(H264Context *h); |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
640 void ff_h264_fill_mbaff_ref_list(H264Context *h); |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
641 void ff_h264_remove_all_refs(H264Context *h); |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
642 |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
643 /** |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
644 * Executes the reference picture marking (memory management control operations). |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
645 */ |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
646 int ff_h264_execute_ref_pic_marking(H264Context *h, MMCO *mmco, int mmco_count); |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
647 |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
648 int ff_h264_decode_ref_pic_marking(H264Context *h, GetBitContext *gb); |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
649 |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
650 |
|
d9c084a0c22b
Split all the reference picture handling off h264.c.
michael
parents:
10859
diff
changeset
|
651 /** |
| 10852 | 652 * checks if the top & left blocks are available if needed & changes the dc mode so it only uses the available blocks. |
| 653 */ | |
|
10863
974ac220c93a
Move check_intra4x4_pred_mode() back from h264.h to h264.c, the function is just
michael
parents:
10862
diff
changeset
|
654 int ff_h264_check_intra4x4_pred_mode(H264Context *h); |
|
974ac220c93a
Move check_intra4x4_pred_mode() back from h264.h to h264.c, the function is just
michael
parents:
10862
diff
changeset
|
655 |
|
974ac220c93a
Move check_intra4x4_pred_mode() back from h264.h to h264.c, the function is just
michael
parents:
10862
diff
changeset
|
656 /** |
|
974ac220c93a
Move check_intra4x4_pred_mode() back from h264.h to h264.c, the function is just
michael
parents:
10862
diff
changeset
|
657 * checks if the top & left blocks are available if needed & changes the dc mode so it only uses the available blocks. |
|
974ac220c93a
Move check_intra4x4_pred_mode() back from h264.h to h264.c, the function is just
michael
parents:
10862
diff
changeset
|
658 */ |
| 10852 | 659 int ff_h264_check_intra_pred_mode(H264Context *h, int mode); |
| 660 | |
| 661 void ff_h264_write_back_intra_pred_mode(H264Context *h); | |
| 662 void ff_h264_hl_decode_mb(H264Context *h); | |
| 663 int ff_h264_frame_start(H264Context *h); | |
| 664 av_cold int ff_h264_decode_init(AVCodecContext *avctx); | |
| 665 av_cold int ff_h264_decode_end(AVCodecContext *avctx); | |
| 10866 | 666 av_cold void ff_h264_decode_init_vlc(void); |
| 667 | |
| 668 /** | |
| 669 * decodes a macroblock | |
| 670 * @returns 0 if OK, AC_ERROR / DC_ERROR / MV_ERROR if an error is noticed | |
| 671 */ | |
| 672 int ff_h264_decode_mb_cavlc(H264Context *h); | |
| 10852 | 673 |
| 10869 | 674 /** |
| 675 * decodes a CABAC coded macroblock | |
| 676 * @returns 0 if OK, AC_ERROR / DC_ERROR / MV_ERROR if an error is noticed | |
| 677 */ | |
| 678 int ff_h264_decode_mb_cabac(H264Context *h); | |
| 679 | |
| 680 void ff_h264_init_cabac_states(H264Context *h); | |
| 681 | |
|
10857
b20434143fd5
Split direct mode (macro)block decoding off h264.c.
michael
parents:
10854
diff
changeset
|
682 void ff_h264_direct_dist_scale_factor(H264Context * const h); |
|
b20434143fd5
Split direct mode (macro)block decoding off h264.c.
michael
parents:
10854
diff
changeset
|
683 void ff_h264_direct_ref_list_init(H264Context * const h); |
|
b20434143fd5
Split direct mode (macro)block decoding off h264.c.
michael
parents:
10854
diff
changeset
|
684 void ff_h264_pred_direct_motion(H264Context * const h, int *mb_type); |
|
b20434143fd5
Split direct mode (macro)block decoding off h264.c.
michael
parents:
10854
diff
changeset
|
685 |
| 10854 | 686 void ff_h264_filter_mb_fast( H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize); |
| 687 void ff_h264_filter_mb( H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize); | |
| 688 | |
| 10858 | 689 /** |
| 690 * Reset SEI values at the beginning of the frame. | |
| 691 * | |
| 692 * @param h H.264 context. | |
| 693 */ | |
| 694 void ff_h264_reset_sei(H264Context *h); | |
| 695 | |
| 696 | |
| 10852 | 697 /* |
| 698 o-o o-o | |
| 699 / / / | |
| 700 o-o o-o | |
| 701 ,---' | |
| 702 o-o o-o | |
| 703 / / / | |
| 704 o-o o-o | |
| 705 */ | |
| 706 //This table must be here because scan8[constant] must be known at compiletime | |
| 707 static const uint8_t scan8[16 + 2*4]={ | |
| 708 4+1*8, 5+1*8, 4+2*8, 5+2*8, | |
| 709 6+1*8, 7+1*8, 6+2*8, 7+2*8, | |
| 710 4+3*8, 5+3*8, 4+4*8, 5+4*8, | |
| 711 6+3*8, 7+3*8, 6+4*8, 7+4*8, | |
| 712 1+1*8, 2+1*8, | |
| 713 1+2*8, 2+2*8, | |
| 714 1+4*8, 2+4*8, | |
| 715 1+5*8, 2+5*8, | |
| 716 }; | |
| 717 | |
| 718 static av_always_inline uint32_t pack16to32(int a, int b){ | |
| 719 #if HAVE_BIGENDIAN | |
| 720 return (b&0xFFFF) + (a<<16); | |
| 721 #else | |
| 722 return (a&0xFFFF) + (b<<16); | |
| 723 #endif | |
| 724 } | |
| 725 | |
| 726 /** | |
| 10854 | 727 * gets the chroma qp. |
| 728 */ | |
| 729 static inline int get_chroma_qp(H264Context *h, int t, int qscale){ | |
| 730 return h->pps.chroma_qp_table[t][qscale]; | |
| 731 } | |
| 732 | |
| 10866 | 733 static inline void pred_pskip_motion(H264Context * const h, int * const mx, int * const my); |
| 734 | |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
735 static void fill_decode_caches(H264Context *h, int mb_type){ |
| 10866 | 736 MpegEncContext * const s = &h->s; |
| 737 const int mb_xy= h->mb_xy; | |
| 738 int topleft_xy, top_xy, topright_xy, left_xy[2]; | |
| 739 int topleft_type, top_type, topright_type, left_type[2]; | |
| 740 const uint8_t * left_block; | |
| 741 int topleft_partition= -1; | |
| 742 int i; | |
|
10909
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
743 static const uint8_t left_block_options[4][16]={ |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
744 {0,1,2,3,7,10,8,11,7+0*8, 7+1*8, 7+2*8, 7+3*8, 2+0*8, 2+3*8, 2+1*8, 2+2*8}, |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
745 {2,2,3,3,8,11,8,11,7+2*8, 7+2*8, 7+3*8, 7+3*8, 2+1*8, 2+2*8, 2+1*8, 2+2*8}, |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
746 {0,0,1,1,7,10,7,10,7+0*8, 7+0*8, 7+1*8, 7+1*8, 2+0*8, 2+3*8, 2+0*8, 2+3*8}, |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
747 {0,2,0,2,7,10,7,10,7+0*8, 7+2*8, 7+0*8, 7+2*8, 2+0*8, 2+3*8, 2+0*8, 2+3*8} |
| 10866 | 748 }; |
| 749 | |
|
11008
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
750 top_xy = mb_xy - (s->mb_stride << MB_FIELD); |
| 10866 | 751 |
| 752 /* Wow, what a mess, why didn't they simplify the interlacing & intra | |
| 753 * stuff, I can't imagine that these complex rules are worth it. */ | |
| 754 | |
| 755 topleft_xy = top_xy - 1; | |
| 756 topright_xy= top_xy + 1; | |
| 757 left_xy[1] = left_xy[0] = mb_xy-1; | |
| 758 left_block = left_block_options[0]; | |
| 759 if(FRAME_MBAFF){ | |
|
11008
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
760 const int left_mb_field_flag = IS_INTERLACED(s->current_picture.mb_type[mb_xy-1]); |
| 10866 | 761 const int curr_mb_field_flag = IS_INTERLACED(mb_type); |
|
11008
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
762 if(s->mb_y&1){ |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
763 if (left_mb_field_flag != curr_mb_field_flag) { |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
764 left_xy[1] = left_xy[0] = mb_xy - s->mb_stride - 1; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
765 if (curr_mb_field_flag) { |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
766 left_xy[1] += s->mb_stride; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
767 left_block = left_block_options[3]; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
768 } else { |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
769 topleft_xy += s->mb_stride; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
770 // take top left mv from the middle of the mb, as opposed to all other modes which use the bottom right partition |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
771 topleft_partition = 0; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
772 left_block = left_block_options[1]; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
773 } |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
774 } |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
775 }else{ |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
776 if(curr_mb_field_flag){ |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
777 topleft_xy += s->mb_stride & (((s->current_picture.mb_type[top_xy - 1]>>7)&1)-1); |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
778 topright_xy += s->mb_stride & (((s->current_picture.mb_type[top_xy + 1]>>7)&1)-1); |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
779 top_xy += s->mb_stride & (((s->current_picture.mb_type[top_xy ]>>7)&1)-1); |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
780 } |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
781 if (left_mb_field_flag != curr_mb_field_flag) { |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
782 left_xy[1] = left_xy[0] = mb_xy - 1; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
783 if (curr_mb_field_flag) { |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
784 left_xy[1] += s->mb_stride; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
785 left_block = left_block_options[3]; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
786 } else { |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
787 left_block = left_block_options[2]; |
|
ec192d9ebac5
Optimize mb neighbor initialization for MBAFF in fill_caches().
michael
parents:
11002
diff
changeset
|
788 } |
| 10866 | 789 } |
| 790 } | |
| 791 } | |
| 792 | |
| 793 h->top_mb_xy = top_xy; | |
| 794 h->left_mb_xy[0] = left_xy[0]; | |
| 795 h->left_mb_xy[1] = left_xy[1]; | |
| 796 topleft_type = h->slice_table[topleft_xy ] == h->slice_num ? s->current_picture.mb_type[topleft_xy] : 0; | |
| 797 top_type = h->slice_table[top_xy ] == h->slice_num ? s->current_picture.mb_type[top_xy] : 0; | |
| 798 topright_type= h->slice_table[topright_xy] == h->slice_num ? s->current_picture.mb_type[topright_xy]: 0; | |
| 799 left_type[0] = h->slice_table[left_xy[0] ] == h->slice_num ? s->current_picture.mb_type[left_xy[0]] : 0; | |
| 800 left_type[1] = h->slice_table[left_xy[1] ] == h->slice_num ? s->current_picture.mb_type[left_xy[1]] : 0; | |
| 801 | |
| 10928 | 802 if(IS_INTRA(mb_type)){ |
| 803 int type_mask= h->pps.constrained_intra_pred ? IS_INTRA(-1) : -1; | |
| 804 h->topleft_samples_available= | |
| 805 h->top_samples_available= | |
| 806 h->left_samples_available= 0xFFFF; | |
| 807 h->topright_samples_available= 0xEEEA; | |
| 10866 | 808 |
| 10928 | 809 if(!(top_type & type_mask)){ |
| 810 h->topleft_samples_available= 0xB3FF; | |
| 811 h->top_samples_available= 0x33FF; | |
| 812 h->topright_samples_available= 0x26EA; | |
| 813 } | |
| 814 if(IS_INTERLACED(mb_type) != IS_INTERLACED(left_type[0])){ | |
| 815 if(IS_INTERLACED(mb_type)){ | |
| 816 if(!(left_type[0] & type_mask)){ | |
| 817 h->topleft_samples_available&= 0xDFFF; | |
| 818 h->left_samples_available&= 0x5FFF; | |
| 819 } | |
| 820 if(!(left_type[1] & type_mask)){ | |
| 821 h->topleft_samples_available&= 0xFF5F; | |
| 822 h->left_samples_available&= 0xFF5F; | |
| 823 } | |
| 824 }else{ | |
| 825 int left_typei = h->slice_table[left_xy[0] + s->mb_stride ] == h->slice_num | |
| 826 ? s->current_picture.mb_type[left_xy[0] + s->mb_stride] : 0; | |
| 827 assert(left_xy[0] == left_xy[1]); | |
| 828 if(!((left_typei & type_mask) && (left_type[0] & type_mask))){ | |
| 829 h->topleft_samples_available&= 0xDF5F; | |
| 830 h->left_samples_available&= 0x5F5F; | |
| 831 } | |
| 10866 | 832 } |
| 833 }else{ | |
| 10928 | 834 if(!(left_type[0] & type_mask)){ |
| 10866 | 835 h->topleft_samples_available&= 0xDF5F; |
| 836 h->left_samples_available&= 0x5F5F; | |
| 837 } | |
| 838 } | |
| 839 | |
| 10928 | 840 if(!(topleft_type & type_mask)) |
| 841 h->topleft_samples_available&= 0x7FFF; | |
| 10866 | 842 |
| 10928 | 843 if(!(topright_type & type_mask)) |
| 844 h->topright_samples_available&= 0xFBFF; | |
| 10866 | 845 |
| 10928 | 846 if(IS_INTRA4x4(mb_type)){ |
| 847 if(IS_INTRA4x4(top_type)){ | |
| 848 h->intra4x4_pred_mode_cache[4+8*0]= h->intra4x4_pred_mode[top_xy][4]; | |
| 849 h->intra4x4_pred_mode_cache[5+8*0]= h->intra4x4_pred_mode[top_xy][5]; | |
| 850 h->intra4x4_pred_mode_cache[6+8*0]= h->intra4x4_pred_mode[top_xy][6]; | |
| 851 h->intra4x4_pred_mode_cache[7+8*0]= h->intra4x4_pred_mode[top_xy][3]; | |
| 10866 | 852 }else{ |
| 853 int pred; | |
| 10928 | 854 if(!(top_type & type_mask)) |
| 10866 | 855 pred= -1; |
| 856 else{ | |
| 857 pred= 2; | |
| 858 } | |
| 10928 | 859 h->intra4x4_pred_mode_cache[4+8*0]= |
| 860 h->intra4x4_pred_mode_cache[5+8*0]= | |
| 861 h->intra4x4_pred_mode_cache[6+8*0]= | |
| 862 h->intra4x4_pred_mode_cache[7+8*0]= pred; | |
| 863 } | |
| 864 for(i=0; i<2; i++){ | |
| 865 if(IS_INTRA4x4(left_type[i])){ | |
| 866 h->intra4x4_pred_mode_cache[3+8*1 + 2*8*i]= h->intra4x4_pred_mode[left_xy[i]][left_block[0+2*i]]; | |
| 867 h->intra4x4_pred_mode_cache[3+8*2 + 2*8*i]= h->intra4x4_pred_mode[left_xy[i]][left_block[1+2*i]]; | |
| 868 }else{ | |
| 869 int pred; | |
| 870 if(!(left_type[i] & type_mask)) | |
| 871 pred= -1; | |
| 872 else{ | |
| 873 pred= 2; | |
| 874 } | |
| 875 h->intra4x4_pred_mode_cache[3+8*1 + 2*8*i]= | |
| 876 h->intra4x4_pred_mode_cache[3+8*2 + 2*8*i]= pred; | |
| 877 } | |
| 10866 | 878 } |
| 879 } | |
| 880 } | |
| 881 | |
| 882 | |
| 883 /* | |
| 884 0 . T T. T T T T | |
| 885 1 L . .L . . . . | |
| 886 2 L . .L . . . . | |
| 887 3 . T TL . . . . | |
| 888 4 L . .L . . . . | |
| 889 5 L . .. . . . . | |
| 890 */ | |
| 891 //FIXME constraint_intra_pred & partitioning & nnz (let us hope this is just a typo in the spec) | |
| 892 if(top_type){ | |
|
10909
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
893 *(uint32_t*)&h->non_zero_count_cache[4+8*0]= *(uint32_t*)&h->non_zero_count[top_xy][4+3*8]; |
| 10928 | 894 h->non_zero_count_cache[1+8*0]= h->non_zero_count[top_xy][1+1*8]; |
| 895 h->non_zero_count_cache[2+8*0]= h->non_zero_count[top_xy][2+1*8]; | |
| 10866 | 896 |
| 10928 | 897 h->non_zero_count_cache[1+8*3]= h->non_zero_count[top_xy][1+2*8]; |
| 898 h->non_zero_count_cache[2+8*3]= h->non_zero_count[top_xy][2+2*8]; | |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
899 }else { |
| 10928 | 900 h->non_zero_count_cache[1+8*0]= |
| 901 h->non_zero_count_cache[2+8*0]= | |
| 10866 | 902 |
| 10928 | 903 h->non_zero_count_cache[1+8*3]= |
| 904 h->non_zero_count_cache[2+8*3]= | |
| 905 *(uint32_t*)&h->non_zero_count_cache[4+8*0]= CABAC && !IS_INTRA(mb_type) ? 0 : 0x40404040; | |
| 10866 | 906 } |
| 907 | |
| 908 for (i=0; i<2; i++) { | |
| 909 if(left_type[i]){ | |
|
10909
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
910 h->non_zero_count_cache[3+8*1 + 2*8*i]= h->non_zero_count[left_xy[i]][left_block[8+0+2*i]]; |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
911 h->non_zero_count_cache[3+8*2 + 2*8*i]= h->non_zero_count[left_xy[i]][left_block[8+1+2*i]]; |
| 10928 | 912 h->non_zero_count_cache[0+8*1 + 8*i]= h->non_zero_count[left_xy[i]][left_block[8+4+2*i]]; |
| 913 h->non_zero_count_cache[0+8*4 + 8*i]= h->non_zero_count[left_xy[i]][left_block[8+5+2*i]]; | |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
914 }else{ |
| 10928 | 915 h->non_zero_count_cache[3+8*1 + 2*8*i]= |
| 916 h->non_zero_count_cache[3+8*2 + 2*8*i]= | |
| 917 h->non_zero_count_cache[0+8*1 + 8*i]= | |
| 918 h->non_zero_count_cache[0+8*4 + 8*i]= CABAC && !IS_INTRA(mb_type) ? 0 : 64; | |
| 10866 | 919 } |
| 920 } | |
| 921 | |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
922 if( CABAC ) { |
| 10866 | 923 // top_cbp |
| 924 if(top_type) { | |
| 925 h->top_cbp = h->cbp_table[top_xy]; | |
| 926 } else if(IS_INTRA(mb_type)) { | |
| 927 h->top_cbp = 0x1C0; | |
| 928 } else { | |
| 929 h->top_cbp = 0; | |
| 930 } | |
| 931 // left_cbp | |
| 932 if (left_type[0]) { | |
| 933 h->left_cbp = h->cbp_table[left_xy[0]] & 0x1f0; | |
| 934 } else if(IS_INTRA(mb_type)) { | |
| 935 h->left_cbp = 0x1C0; | |
| 936 } else { | |
| 937 h->left_cbp = 0; | |
| 938 } | |
| 939 if (left_type[0]) { | |
| 940 h->left_cbp |= ((h->cbp_table[left_xy[0]]>>((left_block[0]&(~1))+1))&0x1) << 1; | |
| 941 } | |
| 942 if (left_type[1]) { | |
| 943 h->left_cbp |= ((h->cbp_table[left_xy[1]]>>((left_block[2]&(~1))+1))&0x1) << 3; | |
| 944 } | |
| 945 } | |
| 946 | |
| 947 #if 1 | |
| 948 if(IS_INTER(mb_type) || IS_DIRECT(mb_type)){ | |
| 949 int list; | |
| 950 for(list=0; list<h->list_count; list++){ | |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
951 if(!USES_LIST(mb_type, list) && !IS_DIRECT(mb_type)){ |
| 10866 | 952 /*if(!h->mv_cache_clean[list]){ |
| 953 memset(h->mv_cache [list], 0, 8*5*2*sizeof(int16_t)); //FIXME clean only input? clean at all? | |
| 954 memset(h->ref_cache[list], PART_NOT_AVAILABLE, 8*5*sizeof(int8_t)); | |
| 955 h->mv_cache_clean[list]= 1; | |
| 956 }*/ | |
| 957 continue; | |
| 958 } | |
| 959 h->mv_cache_clean[list]= 0; | |
| 960 | |
| 961 if(USES_LIST(top_type, list)){ | |
| 962 const int b_xy= h->mb2b_xy[top_xy] + 3*h->b_stride; | |
| 963 const int b8_xy= h->mb2b8_xy[top_xy] + h->b8_stride; | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
964 AV_COPY128(h->mv_cache[list][scan8[0] + 0 - 1*8], s->current_picture.motion_val[list][b_xy + 0]); |
| 10928 | 965 h->ref_cache[list][scan8[0] + 0 - 1*8]= |
| 966 h->ref_cache[list][scan8[0] + 1 - 1*8]= s->current_picture.ref_index[list][b8_xy + 0]; | |
| 967 h->ref_cache[list][scan8[0] + 2 - 1*8]= | |
| 968 h->ref_cache[list][scan8[0] + 3 - 1*8]= s->current_picture.ref_index[list][b8_xy + 1]; | |
| 10866 | 969 }else{ |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
970 AV_ZERO128(h->mv_cache[list][scan8[0] + 0 - 1*8]); |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
971 *(uint32_t*)&h->ref_cache[list][scan8[0] + 0 - 1*8]= ((top_type ? LIST_NOT_USED : PART_NOT_AVAILABLE)&0xFF)*0x01010101; |
| 10866 | 972 } |
| 973 | |
| 974 for(i=0; i<2; i++){ | |
| 975 int cache_idx = scan8[0] - 1 + i*2*8; | |
| 976 if(USES_LIST(left_type[i], list)){ | |
| 977 const int b_xy= h->mb2b_xy[left_xy[i]] + 3; | |
| 978 const int b8_xy= h->mb2b8_xy[left_xy[i]] + 1; | |
| 979 *(uint32_t*)h->mv_cache[list][cache_idx ]= *(uint32_t*)s->current_picture.motion_val[list][b_xy + h->b_stride*left_block[0+i*2]]; | |
| 980 *(uint32_t*)h->mv_cache[list][cache_idx+8]= *(uint32_t*)s->current_picture.motion_val[list][b_xy + h->b_stride*left_block[1+i*2]]; | |
| 10928 | 981 h->ref_cache[list][cache_idx ]= s->current_picture.ref_index[list][b8_xy + h->b8_stride*(left_block[0+i*2]>>1)]; |
| 982 h->ref_cache[list][cache_idx+8]= s->current_picture.ref_index[list][b8_xy + h->b8_stride*(left_block[1+i*2]>>1)]; | |
| 10866 | 983 }else{ |
| 984 *(uint32_t*)h->mv_cache [list][cache_idx ]= | |
| 985 *(uint32_t*)h->mv_cache [list][cache_idx+8]= 0; | |
| 986 h->ref_cache[list][cache_idx ]= | |
| 11019 | 987 h->ref_cache[list][cache_idx+8]= (left_type[i]) ? LIST_NOT_USED : PART_NOT_AVAILABLE; |
| 10866 | 988 } |
| 989 } | |
| 990 | |
| 11019 | 991 if((IS_DIRECT(mb_type) && !h->direct_spatial_mv_pred) && !FRAME_MBAFF) |
| 10866 | 992 continue; |
| 993 | |
| 994 if(USES_LIST(topleft_type, list)){ | |
| 995 const int b_xy = h->mb2b_xy[topleft_xy] + 3 + h->b_stride + (topleft_partition & 2*h->b_stride); | |
| 996 const int b8_xy= h->mb2b8_xy[topleft_xy] + 1 + (topleft_partition & h->b8_stride); | |
| 997 *(uint32_t*)h->mv_cache[list][scan8[0] - 1 - 1*8]= *(uint32_t*)s->current_picture.motion_val[list][b_xy]; | |
| 998 h->ref_cache[list][scan8[0] - 1 - 1*8]= s->current_picture.ref_index[list][b8_xy]; | |
| 999 }else{ | |
| 1000 *(uint32_t*)h->mv_cache[list][scan8[0] - 1 - 1*8]= 0; | |
| 1001 h->ref_cache[list][scan8[0] - 1 - 1*8]= topleft_type ? LIST_NOT_USED : PART_NOT_AVAILABLE; | |
| 1002 } | |
| 1003 | |
| 1004 if(USES_LIST(topright_type, list)){ | |
| 1005 const int b_xy= h->mb2b_xy[topright_xy] + 3*h->b_stride; | |
| 1006 const int b8_xy= h->mb2b8_xy[topright_xy] + h->b8_stride; | |
| 1007 *(uint32_t*)h->mv_cache[list][scan8[0] + 4 - 1*8]= *(uint32_t*)s->current_picture.motion_val[list][b_xy]; | |
| 1008 h->ref_cache[list][scan8[0] + 4 - 1*8]= s->current_picture.ref_index[list][b8_xy]; | |
| 1009 }else{ | |
| 1010 *(uint32_t*)h->mv_cache [list][scan8[0] + 4 - 1*8]= 0; | |
| 1011 h->ref_cache[list][scan8[0] + 4 - 1*8]= topright_type ? LIST_NOT_USED : PART_NOT_AVAILABLE; | |
| 1012 } | |
| 1013 | |
| 1014 if((IS_SKIP(mb_type) || IS_DIRECT(mb_type)) && !FRAME_MBAFF) | |
| 1015 continue; | |
| 1016 | |
| 1017 h->ref_cache[list][scan8[5 ]+1] = | |
| 1018 h->ref_cache[list][scan8[7 ]+1] = | |
| 1019 h->ref_cache[list][scan8[13]+1] = //FIXME remove past 3 (init somewhere else) | |
| 1020 h->ref_cache[list][scan8[4 ]] = | |
| 1021 h->ref_cache[list][scan8[12]] = PART_NOT_AVAILABLE; | |
| 1022 *(uint32_t*)h->mv_cache [list][scan8[5 ]+1]= | |
| 1023 *(uint32_t*)h->mv_cache [list][scan8[7 ]+1]= | |
| 1024 *(uint32_t*)h->mv_cache [list][scan8[13]+1]= //FIXME remove past 3 (init somewhere else) | |
| 1025 *(uint32_t*)h->mv_cache [list][scan8[4 ]]= | |
| 1026 *(uint32_t*)h->mv_cache [list][scan8[12]]= 0; | |
| 1027 | |
|
10893
2aafcafbe1f0
Replace cabac checks in inline functions from h264.h with constants.
michael
parents:
10883
diff
changeset
|
1028 if( CABAC ) { |
| 10866 | 1029 /* XXX beurk, Load mvd */ |
| 1030 if(USES_LIST(top_type, list)){ | |
| 1031 const int b_xy= h->mb2b_xy[top_xy] + 3*h->b_stride; | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1032 AV_COPY128(h->mvd_cache[list][scan8[0] + 0 - 1*8], h->mvd_table[list][b_xy + 0]); |
| 10866 | 1033 }else{ |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1034 AV_ZERO128(h->mvd_cache[list][scan8[0] + 0 - 1*8]); |
| 10866 | 1035 } |
| 1036 if(USES_LIST(left_type[0], list)){ | |
| 1037 const int b_xy= h->mb2b_xy[left_xy[0]] + 3; | |
| 1038 *(uint32_t*)h->mvd_cache[list][scan8[0] - 1 + 0*8]= *(uint32_t*)h->mvd_table[list][b_xy + h->b_stride*left_block[0]]; | |
| 1039 *(uint32_t*)h->mvd_cache[list][scan8[0] - 1 + 1*8]= *(uint32_t*)h->mvd_table[list][b_xy + h->b_stride*left_block[1]]; | |
| 1040 }else{ | |
| 1041 *(uint32_t*)h->mvd_cache [list][scan8[0] - 1 + 0*8]= | |
| 1042 *(uint32_t*)h->mvd_cache [list][scan8[0] - 1 + 1*8]= 0; | |
| 1043 } | |
| 1044 if(USES_LIST(left_type[1], list)){ | |
| 1045 const int b_xy= h->mb2b_xy[left_xy[1]] + 3; | |
| 1046 *(uint32_t*)h->mvd_cache[list][scan8[0] - 1 + 2*8]= *(uint32_t*)h->mvd_table[list][b_xy + h->b_stride*left_block[2]]; | |
| 1047 *(uint32_t*)h->mvd_cache[list][scan8[0] - 1 + 3*8]= *(uint32_t*)h->mvd_table[list][b_xy + h->b_stride*left_block[3]]; | |
| 1048 }else{ | |
| 1049 *(uint32_t*)h->mvd_cache [list][scan8[0] - 1 + 2*8]= | |
| 1050 *(uint32_t*)h->mvd_cache [list][scan8[0] - 1 + 3*8]= 0; | |
| 1051 } | |
| 1052 *(uint32_t*)h->mvd_cache [list][scan8[5 ]+1]= | |
| 1053 *(uint32_t*)h->mvd_cache [list][scan8[7 ]+1]= | |
| 1054 *(uint32_t*)h->mvd_cache [list][scan8[13]+1]= //FIXME remove past 3 (init somewhere else) | |
| 1055 *(uint32_t*)h->mvd_cache [list][scan8[4 ]]= | |
| 1056 *(uint32_t*)h->mvd_cache [list][scan8[12]]= 0; | |
| 1057 | |
| 1058 if(h->slice_type_nos == FF_B_TYPE){ | |
| 1059 fill_rectangle(&h->direct_cache[scan8[0]], 4, 4, 8, 0, 1); | |
| 1060 | |
| 1061 if(IS_DIRECT(top_type)){ | |
| 1062 *(uint32_t*)&h->direct_cache[scan8[0] - 1*8]= 0x01010101; | |
| 1063 }else if(IS_8X8(top_type)){ | |
| 1064 int b8_xy = h->mb2b8_xy[top_xy] + h->b8_stride; | |
| 1065 h->direct_cache[scan8[0] + 0 - 1*8]= h->direct_table[b8_xy]; | |
| 1066 h->direct_cache[scan8[0] + 2 - 1*8]= h->direct_table[b8_xy + 1]; | |
| 1067 }else{ | |
| 1068 *(uint32_t*)&h->direct_cache[scan8[0] - 1*8]= 0; | |
| 1069 } | |
| 1070 | |
| 1071 if(IS_DIRECT(left_type[0])) | |
| 1072 h->direct_cache[scan8[0] - 1 + 0*8]= 1; | |
| 1073 else if(IS_8X8(left_type[0])) | |
| 1074 h->direct_cache[scan8[0] - 1 + 0*8]= h->direct_table[h->mb2b8_xy[left_xy[0]] + 1 + h->b8_stride*(left_block[0]>>1)]; | |
| 1075 else | |
| 1076 h->direct_cache[scan8[0] - 1 + 0*8]= 0; | |
| 1077 | |
| 1078 if(IS_DIRECT(left_type[1])) | |
| 1079 h->direct_cache[scan8[0] - 1 + 2*8]= 1; | |
| 1080 else if(IS_8X8(left_type[1])) | |
| 1081 h->direct_cache[scan8[0] - 1 + 2*8]= h->direct_table[h->mb2b8_xy[left_xy[1]] + 1 + h->b8_stride*(left_block[2]>>1)]; | |
| 1082 else | |
| 1083 h->direct_cache[scan8[0] - 1 + 2*8]= 0; | |
| 1084 } | |
| 1085 } | |
| 1086 | |
| 1087 if(FRAME_MBAFF){ | |
| 1088 #define MAP_MVS\ | |
| 1089 MAP_F2F(scan8[0] - 1 - 1*8, topleft_type)\ | |
| 1090 MAP_F2F(scan8[0] + 0 - 1*8, top_type)\ | |
| 1091 MAP_F2F(scan8[0] + 1 - 1*8, top_type)\ | |
| 1092 MAP_F2F(scan8[0] + 2 - 1*8, top_type)\ | |
| 1093 MAP_F2F(scan8[0] + 3 - 1*8, top_type)\ | |
| 1094 MAP_F2F(scan8[0] + 4 - 1*8, topright_type)\ | |
| 1095 MAP_F2F(scan8[0] - 1 + 0*8, left_type[0])\ | |
| 1096 MAP_F2F(scan8[0] - 1 + 1*8, left_type[0])\ | |
| 1097 MAP_F2F(scan8[0] - 1 + 2*8, left_type[1])\ | |
| 1098 MAP_F2F(scan8[0] - 1 + 3*8, left_type[1]) | |
| 1099 if(MB_FIELD){ | |
| 1100 #define MAP_F2F(idx, mb_type)\ | |
| 1101 if(!IS_INTERLACED(mb_type) && h->ref_cache[list][idx] >= 0){\ | |
| 1102 h->ref_cache[list][idx] <<= 1;\ | |
| 1103 h->mv_cache[list][idx][1] /= 2;\ | |
| 1104 h->mvd_cache[list][idx][1] /= 2;\ | |
| 1105 } | |
| 1106 MAP_MVS | |
| 1107 #undef MAP_F2F | |
| 1108 }else{ | |
| 1109 #define MAP_F2F(idx, mb_type)\ | |
| 1110 if(IS_INTERLACED(mb_type) && h->ref_cache[list][idx] >= 0){\ | |
| 1111 h->ref_cache[list][idx] >>= 1;\ | |
| 1112 h->mv_cache[list][idx][1] <<= 1;\ | |
| 1113 h->mvd_cache[list][idx][1] <<= 1;\ | |
| 1114 } | |
| 1115 MAP_MVS | |
| 1116 #undef MAP_F2F | |
| 1117 } | |
| 1118 } | |
| 1119 } | |
| 1120 } | |
| 1121 #endif | |
| 1122 | |
| 10928 | 1123 h->neighbor_transform_size= !!IS_8x8DCT(top_type) + !!IS_8x8DCT(left_type[0]); |
| 10907 | 1124 } |
| 1125 | |
| 10910 | 1126 /** |
| 1127 * | |
| 1128 * @returns non zero if the loop filter can be skiped | |
| 1129 */ | |
| 1130 static int fill_filter_caches(H264Context *h, int mb_type){ | |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1131 MpegEncContext * const s = &h->s; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1132 const int mb_xy= h->mb_xy; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1133 int top_xy, left_xy[2]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1134 int top_type, left_type[2]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1135 int i; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1136 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1137 top_xy = mb_xy - (s->mb_stride << MB_FIELD); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1138 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1139 //FIXME deblocking could skip the intra and nnz parts. |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1140 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1141 /* Wow, what a mess, why didn't they simplify the interlacing & intra |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1142 * stuff, I can't imagine that these complex rules are worth it. */ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1143 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1144 left_xy[1] = left_xy[0] = mb_xy-1; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1145 if(FRAME_MBAFF){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1146 const int left_mb_field_flag = IS_INTERLACED(s->current_picture.mb_type[mb_xy-1]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1147 const int curr_mb_field_flag = IS_INTERLACED(mb_type); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1148 if(s->mb_y&1){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1149 if (left_mb_field_flag != curr_mb_field_flag) { |
| 11023 | 1150 left_xy[0] -= s->mb_stride; |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1151 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1152 }else{ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1153 if(curr_mb_field_flag){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1154 top_xy += s->mb_stride & (((s->current_picture.mb_type[top_xy ]>>7)&1)-1); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1155 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1156 if (left_mb_field_flag != curr_mb_field_flag) { |
| 11023 | 1157 left_xy[1] += s->mb_stride; |
|
11022
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1158 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1159 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1160 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1161 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1162 h->top_mb_xy = top_xy; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1163 h->left_mb_xy[0] = left_xy[0]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1164 h->left_mb_xy[1] = left_xy[1]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1165 { |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1166 //for sufficiently low qp, filtering wouldn't do anything |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1167 //this is a conservative estimate: could also check beta_offset and more accurate chroma_qp |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1168 int qp_thresh = h->qp_thresh; //FIXME strictly we should store qp_thresh for each mb of a slice |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1169 int qp = s->current_picture.qscale_table[mb_xy]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1170 if(qp <= qp_thresh |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1171 && (left_xy[0]<0 || ((qp + s->current_picture.qscale_table[left_xy[0]] + 1)>>1) <= qp_thresh) |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1172 && (top_xy < 0 || ((qp + s->current_picture.qscale_table[top_xy ] + 1)>>1) <= qp_thresh)){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1173 if(!FRAME_MBAFF) |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1174 return 1; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1175 if( (left_xy[0]< 0 || ((qp + s->current_picture.qscale_table[left_xy[1] ] + 1)>>1) <= qp_thresh) |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1176 && (top_xy < s->mb_stride || ((qp + s->current_picture.qscale_table[top_xy -s->mb_stride] + 1)>>1) <= qp_thresh)) |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1177 return 1; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1178 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1179 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1180 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1181 if(h->deblocking_filter == 2){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1182 h->top_type = top_type = h->slice_table[top_xy ] == h->slice_num ? s->current_picture.mb_type[top_xy] : 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1183 h->left_type[0]= left_type[0] = h->slice_table[left_xy[0] ] == h->slice_num ? s->current_picture.mb_type[left_xy[0]] : 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1184 h->left_type[1]= left_type[1] = h->slice_table[left_xy[1] ] == h->slice_num ? s->current_picture.mb_type[left_xy[1]] : 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1185 }else{ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1186 h->top_type = top_type = h->slice_table[top_xy ] < 0xFFFF ? s->current_picture.mb_type[top_xy] : 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1187 h->left_type[0]= left_type[0] = h->slice_table[left_xy[0] ] < 0xFFFF ? s->current_picture.mb_type[left_xy[0]] : 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1188 h->left_type[1]= left_type[1] = h->slice_table[left_xy[1] ] < 0xFFFF ? s->current_picture.mb_type[left_xy[1]] : 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1189 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1190 if(IS_INTRA(mb_type)) |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1191 return 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1192 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1193 AV_COPY64(&h->non_zero_count_cache[0+8*1], &h->non_zero_count[mb_xy][ 0]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1194 AV_COPY64(&h->non_zero_count_cache[0+8*2], &h->non_zero_count[mb_xy][ 8]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1195 *((uint32_t*)&h->non_zero_count_cache[0+8*5])= *((uint32_t*)&h->non_zero_count[mb_xy][16]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1196 *((uint32_t*)&h->non_zero_count_cache[4+8*3])= *((uint32_t*)&h->non_zero_count[mb_xy][20]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1197 AV_COPY64(&h->non_zero_count_cache[0+8*4], &h->non_zero_count[mb_xy][24]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1198 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1199 h->cbp= h->cbp_table[mb_xy]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1200 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1201 { |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1202 int list; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1203 for(list=0; list<h->list_count; list++){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1204 int8_t *ref; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1205 int y, b_stride; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1206 int16_t (*mv_dst)[2]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1207 int16_t (*mv_src)[2]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1208 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1209 if(!USES_LIST(mb_type, list)){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1210 fill_rectangle( h->mv_cache[list][scan8[0]], 4, 4, 8, pack16to32(0,0), 4); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1211 *(uint32_t*)&h->ref_cache[list][scan8[ 0]] = |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1212 *(uint32_t*)&h->ref_cache[list][scan8[ 2]] = |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1213 *(uint32_t*)&h->ref_cache[list][scan8[ 8]] = |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1214 *(uint32_t*)&h->ref_cache[list][scan8[10]] = ((LIST_NOT_USED)&0xFF)*0x01010101; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1215 continue; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1216 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1217 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1218 ref = &s->current_picture.ref_index[list][h->mb2b8_xy[mb_xy]]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1219 { |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1220 int (*ref2frm)[64] = h->ref2frm[ h->slice_num&(MAX_SLICES-1) ][0] + (MB_MBAFF ? 20 : 2); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1221 *(uint32_t*)&h->ref_cache[list][scan8[ 0]] = |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1222 *(uint32_t*)&h->ref_cache[list][scan8[ 2]] = (pack16to32(ref2frm[list][ref[0]],ref2frm[list][ref[1]])&0x00FF00FF)*0x0101; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1223 ref += h->b8_stride; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1224 *(uint32_t*)&h->ref_cache[list][scan8[ 8]] = |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1225 *(uint32_t*)&h->ref_cache[list][scan8[10]] = (pack16to32(ref2frm[list][ref[0]],ref2frm[list][ref[1]])&0x00FF00FF)*0x0101; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1226 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1227 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1228 b_stride = h->b_stride; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1229 mv_dst = &h->mv_cache[list][scan8[0]]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1230 mv_src = &s->current_picture.motion_val[list][4*s->mb_x + 4*s->mb_y*b_stride]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1231 for(y=0; y<4; y++){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1232 AV_COPY128(mv_dst + 8*y, mv_src + y*b_stride); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1233 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1234 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1235 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1236 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1237 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1238 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1239 /* |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1240 0 . T T. T T T T |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1241 1 L . .L . . . . |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1242 2 L . .L . . . . |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1243 3 . T TL . . . . |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1244 4 L . .L . . . . |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1245 5 L . .. . . . . |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1246 */ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1247 //FIXME constraint_intra_pred & partitioning & nnz (let us hope this is just a typo in the spec) |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1248 if(top_type){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1249 *(uint32_t*)&h->non_zero_count_cache[4+8*0]= *(uint32_t*)&h->non_zero_count[top_xy][4+3*8]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1250 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1251 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1252 if(left_type[0]){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1253 h->non_zero_count_cache[3+8*1]= h->non_zero_count[left_xy[0]][7+0*8]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1254 h->non_zero_count_cache[3+8*2]= h->non_zero_count[left_xy[0]][7+1*8]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1255 h->non_zero_count_cache[3+8*3]= h->non_zero_count[left_xy[0]][7+2*8]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1256 h->non_zero_count_cache[3+8*4]= h->non_zero_count[left_xy[0]][7+3*8]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1257 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1258 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1259 // CAVLC 8x8dct requires NNZ values for residual decoding that differ from what the loop filter needs |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1260 if(!CABAC && h->pps.transform_8x8_mode){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1261 if(IS_8x8DCT(top_type)){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1262 h->non_zero_count_cache[4+8*0]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1263 h->non_zero_count_cache[5+8*0]= h->cbp_table[top_xy] & 4; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1264 h->non_zero_count_cache[6+8*0]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1265 h->non_zero_count_cache[7+8*0]= h->cbp_table[top_xy] & 8; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1266 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1267 if(IS_8x8DCT(left_type[0])){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1268 h->non_zero_count_cache[3+8*1]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1269 h->non_zero_count_cache[3+8*2]= h->cbp_table[left_xy[0]]&2; //FIXME check MBAFF |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1270 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1271 if(IS_8x8DCT(left_type[1])){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1272 h->non_zero_count_cache[3+8*3]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1273 h->non_zero_count_cache[3+8*4]= h->cbp_table[left_xy[1]]&8; //FIXME check MBAFF |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1274 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1275 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1276 if(IS_8x8DCT(mb_type)){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1277 h->non_zero_count_cache[scan8[0 ]]= h->non_zero_count_cache[scan8[1 ]]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1278 h->non_zero_count_cache[scan8[2 ]]= h->non_zero_count_cache[scan8[3 ]]= h->cbp & 1; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1279 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1280 h->non_zero_count_cache[scan8[0+ 4]]= h->non_zero_count_cache[scan8[1+ 4]]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1281 h->non_zero_count_cache[scan8[2+ 4]]= h->non_zero_count_cache[scan8[3+ 4]]= h->cbp & 2; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1282 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1283 h->non_zero_count_cache[scan8[0+ 8]]= h->non_zero_count_cache[scan8[1+ 8]]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1284 h->non_zero_count_cache[scan8[2+ 8]]= h->non_zero_count_cache[scan8[3+ 8]]= h->cbp & 4; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1285 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1286 h->non_zero_count_cache[scan8[0+12]]= h->non_zero_count_cache[scan8[1+12]]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1287 h->non_zero_count_cache[scan8[2+12]]= h->non_zero_count_cache[scan8[3+12]]= h->cbp & 8; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1288 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1289 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1290 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1291 if(IS_INTER(mb_type) || IS_DIRECT(mb_type)){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1292 int list; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1293 for(list=0; list<h->list_count; list++){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1294 if(USES_LIST(top_type, list)){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1295 const int b_xy= h->mb2b_xy[top_xy] + 3*h->b_stride; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1296 const int b8_xy= h->mb2b8_xy[top_xy] + h->b8_stride; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1297 int (*ref2frm)[64] = h->ref2frm[ h->slice_table[top_xy]&(MAX_SLICES-1) ][0] + (MB_MBAFF ? 20 : 2); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1298 AV_COPY128(h->mv_cache[list][scan8[0] + 0 - 1*8], s->current_picture.motion_val[list][b_xy + 0]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1299 h->ref_cache[list][scan8[0] + 0 - 1*8]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1300 h->ref_cache[list][scan8[0] + 1 - 1*8]= ref2frm[list][s->current_picture.ref_index[list][b8_xy + 0]]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1301 h->ref_cache[list][scan8[0] + 2 - 1*8]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1302 h->ref_cache[list][scan8[0] + 3 - 1*8]= ref2frm[list][s->current_picture.ref_index[list][b8_xy + 1]]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1303 }else{ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1304 AV_ZERO128(h->mv_cache[list][scan8[0] + 0 - 1*8]); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1305 *(uint32_t*)&h->ref_cache[list][scan8[0] + 0 - 1*8]= ((LIST_NOT_USED)&0xFF)*0x01010101; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1306 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1307 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1308 if(!IS_INTERLACED(mb_type^left_type[0])){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1309 if(USES_LIST(left_type[0], list)){ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1310 const int b_xy= h->mb2b_xy[left_xy[0]] + 3; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1311 const int b8_xy= h->mb2b8_xy[left_xy[0]] + 1; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1312 int (*ref2frm)[64] = h->ref2frm[ h->slice_table[left_xy[0]]&(MAX_SLICES-1) ][0] + (MB_MBAFF ? 20 : 2); |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1313 *(uint32_t*)h->mv_cache[list][scan8[0] - 1 + 0 ]= *(uint32_t*)s->current_picture.motion_val[list][b_xy + h->b_stride*0]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1314 *(uint32_t*)h->mv_cache[list][scan8[0] - 1 + 8 ]= *(uint32_t*)s->current_picture.motion_val[list][b_xy + h->b_stride*1]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1315 *(uint32_t*)h->mv_cache[list][scan8[0] - 1 +16 ]= *(uint32_t*)s->current_picture.motion_val[list][b_xy + h->b_stride*2]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1316 *(uint32_t*)h->mv_cache[list][scan8[0] - 1 +24 ]= *(uint32_t*)s->current_picture.motion_val[list][b_xy + h->b_stride*3]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1317 h->ref_cache[list][scan8[0] - 1 + 0 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1318 h->ref_cache[list][scan8[0] - 1 + 8 ]= ref2frm[list][s->current_picture.ref_index[list][b8_xy + h->b8_stride*0]]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1319 h->ref_cache[list][scan8[0] - 1 +16 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1320 h->ref_cache[list][scan8[0] - 1 +24 ]= ref2frm[list][s->current_picture.ref_index[list][b8_xy + h->b8_stride*1]]; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1321 }else{ |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1322 *(uint32_t*)h->mv_cache [list][scan8[0] - 1 + 0 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1323 *(uint32_t*)h->mv_cache [list][scan8[0] - 1 + 8 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1324 *(uint32_t*)h->mv_cache [list][scan8[0] - 1 +16 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1325 *(uint32_t*)h->mv_cache [list][scan8[0] - 1 +24 ]= 0; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1326 h->ref_cache[list][scan8[0] - 1 + 0 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1327 h->ref_cache[list][scan8[0] - 1 + 8 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1328 h->ref_cache[list][scan8[0] - 1 + 16 ]= |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1329 h->ref_cache[list][scan8[0] - 1 + 24 ]= LIST_NOT_USED; |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1330 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1331 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1332 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1333 } |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1334 |
|
44529d4292ce
Split fill_caches() between loopfilter & decode, the 2 no longer where common
michael
parents:
11020
diff
changeset
|
1335 return 0; |
| 10907 | 1336 } |
| 1337 | |
| 10866 | 1338 /** |
| 1339 * gets the predicted intra4x4 prediction mode. | |
| 1340 */ | |
| 1341 static inline int pred_intra_mode(H264Context *h, int n){ | |
| 1342 const int index8= scan8[n]; | |
| 1343 const int left= h->intra4x4_pred_mode_cache[index8 - 1]; | |
| 1344 const int top = h->intra4x4_pred_mode_cache[index8 - 8]; | |
| 1345 const int min= FFMIN(left, top); | |
| 1346 | |
| 1347 tprintf(h->s.avctx, "mode:%d %d min:%d\n", left ,top, min); | |
| 1348 | |
| 1349 if(min<0) return DC_PRED; | |
| 1350 else return min; | |
| 1351 } | |
| 1352 | |
| 1353 static inline void write_back_non_zero_count(H264Context *h){ | |
| 1354 const int mb_xy= h->mb_xy; | |
| 1355 | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1356 AV_COPY64(&h->non_zero_count[mb_xy][ 0], &h->non_zero_count_cache[0+8*1]); |
|
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1357 AV_COPY64(&h->non_zero_count[mb_xy][ 8], &h->non_zero_count_cache[0+8*2]); |
|
10909
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
1358 *((uint32_t*)&h->non_zero_count[mb_xy][16]) = *((uint32_t*)&h->non_zero_count_cache[0+8*5]); |
|
f4cf3960b8c6
Reorganize how values are stored in h->non_zero_count.
michael
parents:
10908
diff
changeset
|
1359 *((uint32_t*)&h->non_zero_count[mb_xy][20]) = *((uint32_t*)&h->non_zero_count_cache[4+8*3]); |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1360 AV_COPY64(&h->non_zero_count[mb_xy][24], &h->non_zero_count_cache[0+8*4]); |
| 10866 | 1361 } |
| 1362 | |
| 1363 static inline void write_back_motion(H264Context *h, int mb_type){ | |
| 1364 MpegEncContext * const s = &h->s; | |
| 1365 const int b_xy = 4*s->mb_x + 4*s->mb_y*h->b_stride; | |
| 1366 const int b8_xy= 2*s->mb_x + 2*s->mb_y*h->b8_stride; | |
| 1367 int list; | |
| 1368 | |
| 1369 if(!USES_LIST(mb_type, 0)) | |
| 1370 fill_rectangle(&s->current_picture.ref_index[0][b8_xy], 2, 2, h->b8_stride, (uint8_t)LIST_NOT_USED, 1); | |
| 1371 | |
| 1372 for(list=0; list<h->list_count; list++){ | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1373 int y, b_stride; |
|
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1374 int16_t (*mv_dst)[2]; |
|
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1375 int16_t (*mv_src)[2]; |
|
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1376 |
| 10866 | 1377 if(!USES_LIST(mb_type, list)) |
| 1378 continue; | |
| 1379 | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1380 b_stride = h->b_stride; |
|
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1381 mv_dst = &s->current_picture.motion_val[list][b_xy]; |
|
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1382 mv_src = &h->mv_cache[list][scan8[0]]; |
| 10866 | 1383 for(y=0; y<4; y++){ |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1384 AV_COPY128(mv_dst + y*b_stride, mv_src + 8*y); |
| 10866 | 1385 } |
|
10893
2aafcafbe1f0
Replace cabac checks in inline functions from h264.h with constants.
michael
parents:
10883
diff
changeset
|
1386 if( CABAC ) { |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1387 int16_t (*mvd_dst)[2] = &h->mvd_table[list][b_xy]; |
|
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1388 int16_t (*mvd_src)[2] = &h->mvd_cache[list][scan8[0]]; |
| 10866 | 1389 if(IS_SKIP(mb_type)) |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1390 fill_rectangle(mvd_dst, 4, 4, h->b_stride, 0, 4); |
| 10866 | 1391 else |
| 1392 for(y=0; y<4; y++){ | |
|
11002
1c8892d7a090
H.264: Use 64-/128-bit write-combining macros for copies
astrange
parents:
10987
diff
changeset
|
1393 AV_COPY128(mvd_dst + y*b_stride, mvd_src + 8*y); |
| 10866 | 1394 } |
| 1395 } | |
| 1396 | |
| 1397 { | |
| 1398 int8_t *ref_index = &s->current_picture.ref_index[list][b8_xy]; | |
| 1399 ref_index[0+0*h->b8_stride]= h->ref_cache[list][scan8[0]]; | |
| 1400 ref_index[1+0*h->b8_stride]= h->ref_cache[list][scan8[4]]; | |
| 1401 ref_index[0+1*h->b8_stride]= h->ref_cache[list][scan8[8]]; | |
| 1402 ref_index[1+1*h->b8_stride]= h->ref_cache[list][scan8[12]]; | |
| 1403 } | |
| 1404 } | |
| 1405 | |
|
10893
2aafcafbe1f0
Replace cabac checks in inline functions from h264.h with constants.
michael
parents:
10883
diff
changeset
|
1406 if(h->slice_type_nos == FF_B_TYPE && CABAC){ |
| 10866 | 1407 if(IS_8X8(mb_type)){ |
| 1408 uint8_t *direct_table = &h->direct_table[b8_xy]; | |
| 1409 direct_table[1+0*h->b8_stride] = IS_DIRECT(h->sub_mb_type[1]) ? 1 : 0; | |
| 1410 direct_table[0+1*h->b8_stride] = IS_DIRECT(h->sub_mb_type[2]) ? 1 : 0; | |
| 1411 direct_table[1+1*h->b8_stride] = IS_DIRECT(h->sub_mb_type[3]) ? 1 : 0; | |
| 1412 } | |
| 1413 } | |
| 1414 } | |
| 1415 | |
| 1416 static inline int get_dct8x8_allowed(H264Context *h){ | |
| 1417 if(h->sps.direct_8x8_inference_flag) | |
| 1418 return !(*(uint64_t*)h->sub_mb_type & ((MB_TYPE_16x8|MB_TYPE_8x16|MB_TYPE_8x8 )*0x0001000100010001ULL)); | |
| 1419 else | |
| 1420 return !(*(uint64_t*)h->sub_mb_type & ((MB_TYPE_16x8|MB_TYPE_8x16|MB_TYPE_8x8|MB_TYPE_DIRECT2)*0x0001000100010001ULL)); | |
| 1421 } | |
| 1422 | |
| 1423 static void predict_field_decoding_flag(H264Context *h){ | |
| 1424 MpegEncContext * const s = &h->s; | |
| 1425 const int mb_xy= h->mb_xy; | |
| 1426 int mb_type = (h->slice_table[mb_xy-1] == h->slice_num) | |
| 1427 ? s->current_picture.mb_type[mb_xy-1] | |
| 1428 : (h->slice_table[mb_xy-s->mb_stride] == h->slice_num) | |
| 1429 ? s->current_picture.mb_type[mb_xy-s->mb_stride] | |
| 1430 : 0; | |
| 1431 h->mb_mbaff = h->mb_field_decoding_flag = IS_INTERLACED(mb_type) ? 1 : 0; | |
| 1432 } | |
| 1433 | |
| 1434 /** | |
| 1435 * decodes a P_SKIP or B_SKIP macroblock | |
| 1436 */ | |
| 1437 static void decode_mb_skip(H264Context *h){ | |
| 1438 MpegEncContext * const s = &h->s; | |
| 1439 const int mb_xy= h->mb_xy; | |
| 1440 int mb_type=0; | |
| 1441 | |
| 10906 | 1442 memset(h->non_zero_count[mb_xy], 0, 32); |
| 10866 | 1443 memset(h->non_zero_count_cache + 8, 0, 8*5); //FIXME ugly, remove pfui |
| 1444 | |
| 1445 if(MB_FIELD) | |
| 1446 mb_type|= MB_TYPE_INTERLACED; | |
| 1447 | |
| 1448 if( h->slice_type_nos == FF_B_TYPE ) | |
| 1449 { | |
| 1450 // just for fill_caches. pred_direct_motion will set the real mb_type | |
| 1451 mb_type|= MB_TYPE_P0L0|MB_TYPE_P0L1|MB_TYPE_DIRECT2|MB_TYPE_SKIP; | |
| 1452 | |
| 10907 | 1453 fill_decode_caches(h, mb_type); //FIXME check what is needed and what not ... |
| 10866 | 1454 ff_h264_pred_direct_motion(h, &mb_type); |
| 1455 mb_type|= MB_TYPE_SKIP; | |
| 1456 } | |
| 1457 else | |
| 1458 { | |
| 1459 int mx, my; | |
| 1460 mb_type|= MB_TYPE_16x16|MB_TYPE_P0L0|MB_TYPE_P1L0|MB_TYPE_SKIP; | |
| 1461 | |
| 10907 | 1462 fill_decode_caches(h, mb_type); //FIXME check what is needed and what not ... |
| 10866 | 1463 pred_pskip_motion(h, &mx, &my); |
| 1464 fill_rectangle(&h->ref_cache[0][scan8[0]], 4, 4, 8, 0, 1); | |
| 1465 fill_rectangle( h->mv_cache[0][scan8[0]], 4, 4, 8, pack16to32(mx,my), 4); | |
| 1466 } | |
| 1467 | |
| 1468 write_back_motion(h, mb_type); | |
| 1469 s->current_picture.mb_type[mb_xy]= mb_type; | |
| 1470 s->current_picture.qscale_table[mb_xy]= s->qscale; | |
| 1471 h->slice_table[ mb_xy ]= h->slice_num; | |
| 1472 h->prev_mb_skipped= 1; | |
| 1473 } | |
| 1474 | |
|
10883
4701b9355d93
Add forgotten include of h264_mvpred.h to h264.h.
michael
parents:
10869
diff
changeset
|
1475 #include "h264_mvpred.h" //For pred_pskip_motion() |
|
4701b9355d93
Add forgotten include of h264_mvpred.h to h264.h.
michael
parents:
10869
diff
changeset
|
1476 |
| 7760 | 1477 #endif /* AVCODEC_H264_H */ |
