blob: 7e66ed72247c5ab9f36d09dc9f1d505e57763eeb
1 | /* |
2 | * H.26L/H.264/AVC/JVT/14496-10/... parameter set decoding |
3 | * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at> |
4 | * |
5 | * This file is part of FFmpeg. |
6 | * |
7 | * FFmpeg is free software; you can redistribute it and/or |
8 | * modify it under the terms of the GNU Lesser General Public |
9 | * License as published by the Free Software Foundation; either |
10 | * version 2.1 of the License, or (at your option) any later version. |
11 | * |
12 | * FFmpeg is distributed in the hope that it will be useful, |
13 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
14 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
15 | * Lesser General Public License for more details. |
16 | * |
17 | * You should have received a copy of the GNU Lesser General Public |
18 | * License along with FFmpeg; if not, write to the Free Software |
19 | * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
20 | */ |
21 | |
22 | /** |
23 | * @file |
24 | * H.264 / AVC / MPEG-4 part10 parameter set decoding. |
25 | * @author Michael Niedermayer <michaelni@gmx.at> |
26 | */ |
27 | |
28 | #include <inttypes.h> |
29 | |
30 | #include "libavutil/imgutils.h" |
31 | #include "internal.h" |
32 | #include "mathops.h" |
33 | #include "avcodec.h" |
34 | #include "h264data.h" |
35 | #include "h264_ps.h" |
36 | #include "golomb.h" |
37 | |
/* Inclusive bounds for log2_max_frame_num (the coded
 * log2_max_frame_num_minus4 value plus 4) accepted by the SPS parser. */
#define MAX_LOG2_MAX_FRAME_NUM (12 + 4)
#define MIN_LOG2_MAX_FRAME_NUM 4

/* aspect_ratio_idc value for which the VUI carries an explicit 16-bit
 * sample aspect ratio numerator and denominator. */
#define EXTENDED_SAR 255
42 | |
/*
 * Preset 4x4 scaling lists: entry 0 is used for the intra lists, entry 1
 * for the inter lists. They are copied verbatim into the factor arrays, so
 * they are stored in the same layout as those arrays.
 */
static const uint8_t default_scaling4[2][16] = {
    [0] = {
         6, 13, 20, 28,
        13, 20, 28, 32,
        20, 28, 32, 37,
        28, 32, 37, 42,
    },
    [1] = {
        10, 14, 20, 24,
        14, 20, 24, 27,
        20, 24, 27, 30,
        24, 27, 30, 34,
    },
};
49 | |
/*
 * Preset 8x8 scaling lists: entry 0 is used for the intra lists, entry 1
 * for the inter lists. Like the 4x4 presets they are copied verbatim into
 * the factor arrays.
 */
static const uint8_t default_scaling8[2][64] = {
    [0] = {
         6, 10, 13, 16, 18, 23, 25, 27,
        10, 11, 16, 18, 23, 25, 27, 29,
        13, 16, 18, 23, 25, 27, 29, 31,
        16, 18, 23, 25, 27, 29, 31, 33,
        18, 23, 25, 27, 29, 31, 33, 36,
        23, 25, 27, 29, 31, 33, 36, 38,
        25, 27, 29, 31, 33, 36, 38, 40,
        27, 29, 31, 33, 36, 38, 40, 42,
    },
    [1] = {
         9, 13, 15, 17, 19, 21, 22, 24,
        13, 13, 17, 19, 21, 22, 24, 25,
        15, 17, 19, 21, 22, 24, 25, 27,
        17, 19, 21, 22, 24, 25, 27, 28,
        19, 21, 22, 24, 25, 27, 28, 30,
        21, 22, 24, 25, 27, 28, 30, 32,
        22, 24, 25, 27, 28, 30, 32, 33,
        24, 25, 27, 28, 30, 32, 33, 35,
    },
};
68 | |
/*
 * Maximum number of macroblocks in the decoded picture buffer (MaxDpbMbs)
 * for a given level. Each row is { level_idc, MaxDpbMbs }; rows are looked
 * up by an exact match on level_idc, so their order is not significant.
 * Levels 6, 6.1 and 6.2 are included so that streams signalling them also
 * get a level-derived reorder depth instead of the generic maximum.
 */
static const int level_max_dpb_mbs[][2] = {
    { 10, 396    },
    { 11, 900    },
    { 12, 2376   },
    { 13, 2376   },
    { 20, 2376   },
    { 21, 4752   },
    { 22, 8100   },
    { 30, 8100   },
    { 31, 18000  },
    { 32, 20480  },
    { 40, 32768  },
    { 41, 32768  },
    { 42, 34816  },
    { 50, 110400 },
    { 51, 184320 },
    { 52, 184320 },
    { 60, 696320 },
    { 61, 696320 },
    { 62, 696320 },
};
88 | |
89 | static void remove_pps(H264ParamSets *s, int id) |
90 | { |
91 | av_buffer_unref(&s->pps_list[id]); |
92 | } |
93 | |
94 | static void remove_sps(H264ParamSets *s, int id) |
95 | { |
96 | #if 0 |
97 | int i; |
98 | if (s->sps_list[id]) { |
99 | /* drop all PPS that depend on this SPS */ |
100 | for (i = 0; i < FF_ARRAY_ELEMS(s->pps_list); i++) |
101 | if (s->pps_list[i] && ((PPS*)s->pps_list[i]->data)->sps_id == id) |
102 | remove_pps(s, i); |
103 | } |
104 | #endif |
105 | av_buffer_unref(&s->sps_list[id]); |
106 | } |
107 | |
108 | static inline int decode_hrd_parameters(GetBitContext *gb, AVCodecContext *avctx, |
109 | SPS *sps) |
110 | { |
111 | int cpb_count, i; |
112 | cpb_count = get_ue_golomb_31(gb) + 1; |
113 | |
114 | if (cpb_count > 32U) { |
115 | av_log(avctx, AV_LOG_ERROR, "cpb_count %d invalid\n", cpb_count); |
116 | return AVERROR_INVALIDDATA; |
117 | } |
118 | |
119 | get_bits(gb, 4); /* bit_rate_scale */ |
120 | get_bits(gb, 4); /* cpb_size_scale */ |
121 | for (i = 0; i < cpb_count; i++) { |
122 | get_ue_golomb_long(gb); /* bit_rate_value_minus1 */ |
123 | get_ue_golomb_long(gb); /* cpb_size_value_minus1 */ |
124 | get_bits1(gb); /* cbr_flag */ |
125 | } |
126 | sps->initial_cpb_removal_delay_length = get_bits(gb, 5) + 1; |
127 | sps->cpb_removal_delay_length = get_bits(gb, 5) + 1; |
128 | sps->dpb_output_delay_length = get_bits(gb, 5) + 1; |
129 | sps->time_offset_length = get_bits(gb, 5); |
130 | sps->cpb_cnt = cpb_count; |
131 | return 0; |
132 | } |
133 | |
134 | static inline int decode_vui_parameters(GetBitContext *gb, AVCodecContext *avctx, |
135 | SPS *sps) |
136 | { |
137 | int aspect_ratio_info_present_flag; |
138 | unsigned int aspect_ratio_idc; |
139 | |
140 | aspect_ratio_info_present_flag = get_bits1(gb); |
141 | |
142 | if (aspect_ratio_info_present_flag) { |
143 | aspect_ratio_idc = get_bits(gb, 8); |
144 | if (aspect_ratio_idc == EXTENDED_SAR) { |
145 | sps->sar.num = get_bits(gb, 16); |
146 | sps->sar.den = get_bits(gb, 16); |
147 | } else if (aspect_ratio_idc < FF_ARRAY_ELEMS(ff_h264_pixel_aspect)) { |
148 | sps->sar = ff_h264_pixel_aspect[aspect_ratio_idc]; |
149 | } else { |
150 | av_log(avctx, AV_LOG_ERROR, "illegal aspect ratio\n"); |
151 | return AVERROR_INVALIDDATA; |
152 | } |
153 | } else { |
154 | sps->sar.num = |
155 | sps->sar.den = 0; |
156 | } |
157 | |
158 | if (get_bits1(gb)) /* overscan_info_present_flag */ |
159 | get_bits1(gb); /* overscan_appropriate_flag */ |
160 | |
161 | sps->video_signal_type_present_flag = get_bits1(gb); |
162 | if (sps->video_signal_type_present_flag) { |
163 | get_bits(gb, 3); /* video_format */ |
164 | sps->full_range = get_bits1(gb); /* video_full_range_flag */ |
165 | |
166 | sps->colour_description_present_flag = get_bits1(gb); |
167 | if (sps->colour_description_present_flag) { |
168 | sps->color_primaries = get_bits(gb, 8); /* colour_primaries */ |
169 | sps->color_trc = get_bits(gb, 8); /* transfer_characteristics */ |
170 | sps->colorspace = get_bits(gb, 8); /* matrix_coefficients */ |
171 | if (sps->color_primaries >= AVCOL_PRI_NB) |
172 | sps->color_primaries = AVCOL_PRI_UNSPECIFIED; |
173 | if (sps->color_trc >= AVCOL_TRC_NB) |
174 | sps->color_trc = AVCOL_TRC_UNSPECIFIED; |
175 | if (sps->colorspace >= AVCOL_SPC_NB) |
176 | sps->colorspace = AVCOL_SPC_UNSPECIFIED; |
177 | } |
178 | } |
179 | |
180 | /* chroma_location_info_present_flag */ |
181 | if (get_bits1(gb)) { |
182 | /* chroma_sample_location_type_top_field */ |
183 | avctx->chroma_sample_location = get_ue_golomb(gb) + 1; |
184 | get_ue_golomb(gb); /* chroma_sample_location_type_bottom_field */ |
185 | } |
186 | |
187 | if (show_bits1(gb) && get_bits_left(gb) < 10) { |
188 | av_log(avctx, AV_LOG_WARNING, "Truncated VUI\n"); |
189 | return 0; |
190 | } |
191 | |
192 | sps->timing_info_present_flag = get_bits1(gb); |
193 | if (sps->timing_info_present_flag) { |
194 | unsigned num_units_in_tick = get_bits_long(gb, 32); |
195 | unsigned time_scale = get_bits_long(gb, 32); |
196 | if (!num_units_in_tick || !time_scale) { |
197 | av_log(avctx, AV_LOG_ERROR, |
198 | "time_scale/num_units_in_tick invalid or unsupported (%u/%u)\n", |
199 | time_scale, num_units_in_tick); |
200 | sps->timing_info_present_flag = 0; |
201 | } else { |
202 | sps->num_units_in_tick = num_units_in_tick; |
203 | sps->time_scale = time_scale; |
204 | } |
205 | sps->fixed_frame_rate_flag = get_bits1(gb); |
206 | } |
207 | |
208 | sps->nal_hrd_parameters_present_flag = get_bits1(gb); |
209 | if (sps->nal_hrd_parameters_present_flag) |
210 | if (decode_hrd_parameters(gb, avctx, sps) < 0) |
211 | return AVERROR_INVALIDDATA; |
212 | sps->vcl_hrd_parameters_present_flag = get_bits1(gb); |
213 | if (sps->vcl_hrd_parameters_present_flag) |
214 | if (decode_hrd_parameters(gb, avctx, sps) < 0) |
215 | return AVERROR_INVALIDDATA; |
216 | if (sps->nal_hrd_parameters_present_flag || |
217 | sps->vcl_hrd_parameters_present_flag) |
218 | get_bits1(gb); /* low_delay_hrd_flag */ |
219 | sps->pic_struct_present_flag = get_bits1(gb); |
220 | if (!get_bits_left(gb)) |
221 | return 0; |
222 | sps->bitstream_restriction_flag = get_bits1(gb); |
223 | if (sps->bitstream_restriction_flag) { |
224 | get_bits1(gb); /* motion_vectors_over_pic_boundaries_flag */ |
225 | get_ue_golomb(gb); /* max_bytes_per_pic_denom */ |
226 | get_ue_golomb(gb); /* max_bits_per_mb_denom */ |
227 | get_ue_golomb(gb); /* log2_max_mv_length_horizontal */ |
228 | get_ue_golomb(gb); /* log2_max_mv_length_vertical */ |
229 | sps->num_reorder_frames = get_ue_golomb(gb); |
230 | get_ue_golomb(gb); /*max_dec_frame_buffering*/ |
231 | |
232 | if (get_bits_left(gb) < 0) { |
233 | sps->num_reorder_frames = 0; |
234 | sps->bitstream_restriction_flag = 0; |
235 | } |
236 | |
237 | if (sps->num_reorder_frames > 16U |
238 | /* max_dec_frame_buffering || max_dec_frame_buffering > 16 */) { |
239 | av_log(avctx, AV_LOG_ERROR, |
240 | "Clipping illegal num_reorder_frames %d\n", |
241 | sps->num_reorder_frames); |
242 | sps->num_reorder_frames = 16; |
243 | return AVERROR_INVALIDDATA; |
244 | } |
245 | } |
246 | |
247 | return 0; |
248 | } |
249 | |
250 | static int decode_scaling_list(GetBitContext *gb, uint8_t *factors, int size, |
251 | const uint8_t *jvt_list, |
252 | const uint8_t *fallback_list) |
253 | { |
254 | int i, last = 8, next = 8; |
255 | const uint8_t *scan = size == 16 ? ff_zigzag_scan : ff_zigzag_direct; |
256 | if (!get_bits1(gb)) /* matrix not written, we use the predicted one */ |
257 | memcpy(factors, fallback_list, size * sizeof(uint8_t)); |
258 | else |
259 | for (i = 0; i < size; i++) { |
260 | if (next) { |
261 | int v = get_se_golomb(gb); |
262 | if (v < -128 || v > 127) { |
263 | av_log(NULL, AV_LOG_ERROR, "delta scale %d is invalid\n", v); |
264 | return AVERROR_INVALIDDATA; |
265 | } |
266 | next = (last + v) & 0xff; |
267 | } |
268 | if (!i && !next) { /* matrix not written, we use the preset one */ |
269 | memcpy(factors, jvt_list, size * sizeof(uint8_t)); |
270 | break; |
271 | } |
272 | last = factors[scan[i]] = next ? next : last; |
273 | } |
274 | return 0; |
275 | } |
276 | |
277 | /* returns non zero if the provided SPS scaling matrix has been filled */ |
278 | static int decode_scaling_matrices(GetBitContext *gb, const SPS *sps, |
279 | const PPS *pps, int is_sps, |
280 | uint8_t(*scaling_matrix4)[16], |
281 | uint8_t(*scaling_matrix8)[64]) |
282 | { |
283 | int fallback_sps = !is_sps && sps->scaling_matrix_present; |
284 | const uint8_t *fallback[4] = { |
285 | fallback_sps ? sps->scaling_matrix4[0] : default_scaling4[0], |
286 | fallback_sps ? sps->scaling_matrix4[3] : default_scaling4[1], |
287 | fallback_sps ? sps->scaling_matrix8[0] : default_scaling8[0], |
288 | fallback_sps ? sps->scaling_matrix8[3] : default_scaling8[1] |
289 | }; |
290 | int ret = 0; |
291 | if (get_bits1(gb)) { |
292 | ret |= decode_scaling_list(gb, scaling_matrix4[0], 16, default_scaling4[0], fallback[0]); // Intra, Y |
293 | ret |= decode_scaling_list(gb, scaling_matrix4[1], 16, default_scaling4[0], scaling_matrix4[0]); // Intra, Cr |
294 | ret |= decode_scaling_list(gb, scaling_matrix4[2], 16, default_scaling4[0], scaling_matrix4[1]); // Intra, Cb |
295 | ret |= decode_scaling_list(gb, scaling_matrix4[3], 16, default_scaling4[1], fallback[1]); // Inter, Y |
296 | ret |= decode_scaling_list(gb, scaling_matrix4[4], 16, default_scaling4[1], scaling_matrix4[3]); // Inter, Cr |
297 | ret |= decode_scaling_list(gb, scaling_matrix4[5], 16, default_scaling4[1], scaling_matrix4[4]); // Inter, Cb |
298 | if (is_sps || pps->transform_8x8_mode) { |
299 | ret |= decode_scaling_list(gb, scaling_matrix8[0], 64, default_scaling8[0], fallback[2]); // Intra, Y |
300 | ret |= decode_scaling_list(gb, scaling_matrix8[3], 64, default_scaling8[1], fallback[3]); // Inter, Y |
301 | if (sps->chroma_format_idc == 3) { |
302 | ret |= decode_scaling_list(gb, scaling_matrix8[1], 64, default_scaling8[0], scaling_matrix8[0]); // Intra, Cr |
303 | ret |= decode_scaling_list(gb, scaling_matrix8[4], 64, default_scaling8[1], scaling_matrix8[3]); // Inter, Cr |
304 | ret |= decode_scaling_list(gb, scaling_matrix8[2], 64, default_scaling8[0], scaling_matrix8[1]); // Intra, Cb |
305 | ret |= decode_scaling_list(gb, scaling_matrix8[5], 64, default_scaling8[1], scaling_matrix8[4]); // Inter, Cb |
306 | } |
307 | } |
308 | if (!ret) |
309 | ret = is_sps; |
310 | } |
311 | |
312 | return ret; |
313 | } |
314 | |
315 | void ff_h264_ps_uninit(H264ParamSets *ps) |
316 | { |
317 | int i; |
318 | |
319 | for (i = 0; i < MAX_SPS_COUNT; i++) |
320 | av_buffer_unref(&ps->sps_list[i]); |
321 | |
322 | for (i = 0; i < MAX_PPS_COUNT; i++) |
323 | av_buffer_unref(&ps->pps_list[i]); |
324 | |
325 | av_buffer_unref(&ps->sps_ref); |
326 | av_buffer_unref(&ps->pps_ref); |
327 | |
328 | ps->pps = NULL; |
329 | ps->sps = NULL; |
330 | } |
331 | |
332 | int ff_h264_decode_seq_parameter_set(GetBitContext *gb, AVCodecContext *avctx, |
333 | H264ParamSets *ps, int ignore_truncation) |
334 | { |
335 | AVBufferRef *sps_buf; |
336 | int profile_idc, level_idc, constraint_set_flags = 0; |
337 | unsigned int sps_id; |
338 | int i, log2_max_frame_num_minus4; |
339 | SPS *sps; |
340 | int ret; |
341 | |
342 | sps_buf = av_buffer_allocz(sizeof(*sps)); |
343 | if (!sps_buf) |
344 | return AVERROR(ENOMEM); |
345 | sps = (SPS*)sps_buf->data; |
346 | |
347 | sps->data_size = gb->buffer_end - gb->buffer; |
348 | if (sps->data_size > sizeof(sps->data)) { |
349 | av_log(avctx, AV_LOG_WARNING, "Truncating likely oversized SPS\n"); |
350 | sps->data_size = sizeof(sps->data); |
351 | } |
352 | memcpy(sps->data, gb->buffer, sps->data_size); |
353 | |
354 | profile_idc = get_bits(gb, 8); |
355 | constraint_set_flags |= get_bits1(gb) << 0; // constraint_set0_flag |
356 | constraint_set_flags |= get_bits1(gb) << 1; // constraint_set1_flag |
357 | constraint_set_flags |= get_bits1(gb) << 2; // constraint_set2_flag |
358 | constraint_set_flags |= get_bits1(gb) << 3; // constraint_set3_flag |
359 | constraint_set_flags |= get_bits1(gb) << 4; // constraint_set4_flag |
360 | constraint_set_flags |= get_bits1(gb) << 5; // constraint_set5_flag |
361 | skip_bits(gb, 2); // reserved_zero_2bits |
362 | level_idc = get_bits(gb, 8); |
363 | sps_id = get_ue_golomb_31(gb); |
364 | |
365 | if (sps_id >= MAX_SPS_COUNT) { |
366 | av_log(avctx, AV_LOG_ERROR, "sps_id %u out of range\n", sps_id); |
367 | goto fail; |
368 | } |
369 | |
370 | sps->sps_id = sps_id; |
371 | sps->time_offset_length = 24; |
372 | sps->profile_idc = profile_idc; |
373 | sps->constraint_set_flags = constraint_set_flags; |
374 | sps->level_idc = level_idc; |
375 | sps->full_range = -1; |
376 | |
377 | memset(sps->scaling_matrix4, 16, sizeof(sps->scaling_matrix4)); |
378 | memset(sps->scaling_matrix8, 16, sizeof(sps->scaling_matrix8)); |
379 | sps->scaling_matrix_present = 0; |
380 | sps->colorspace = 2; //AVCOL_SPC_UNSPECIFIED |
381 | |
382 | if (sps->profile_idc == 100 || // High profile |
383 | sps->profile_idc == 110 || // High10 profile |
384 | sps->profile_idc == 122 || // High422 profile |
385 | sps->profile_idc == 244 || // High444 Predictive profile |
386 | sps->profile_idc == 44 || // Cavlc444 profile |
387 | sps->profile_idc == 83 || // Scalable Constrained High profile (SVC) |
388 | sps->profile_idc == 86 || // Scalable High Intra profile (SVC) |
389 | sps->profile_idc == 118 || // Stereo High profile (MVC) |
390 | sps->profile_idc == 128 || // Multiview High profile (MVC) |
391 | sps->profile_idc == 138 || // Multiview Depth High profile (MVCD) |
392 | sps->profile_idc == 144) { // old High444 profile |
393 | sps->chroma_format_idc = get_ue_golomb_31(gb); |
394 | if (sps->chroma_format_idc > 3U) { |
395 | avpriv_request_sample(avctx, "chroma_format_idc %u", |
396 | sps->chroma_format_idc); |
397 | goto fail; |
398 | } else if (sps->chroma_format_idc == 3) { |
399 | sps->residual_color_transform_flag = get_bits1(gb); |
400 | if (sps->residual_color_transform_flag) { |
401 | av_log(avctx, AV_LOG_ERROR, "separate color planes are not supported\n"); |
402 | goto fail; |
403 | } |
404 | } |
405 | sps->bit_depth_luma = get_ue_golomb(gb) + 8; |
406 | sps->bit_depth_chroma = get_ue_golomb(gb) + 8; |
407 | if (sps->bit_depth_chroma != sps->bit_depth_luma) { |
408 | avpriv_request_sample(avctx, |
409 | "Different chroma and luma bit depth"); |
410 | goto fail; |
411 | } |
412 | if (sps->bit_depth_luma < 8 || sps->bit_depth_luma > 14 || |
413 | sps->bit_depth_chroma < 8 || sps->bit_depth_chroma > 14) { |
414 | av_log(avctx, AV_LOG_ERROR, "illegal bit depth value (%d, %d)\n", |
415 | sps->bit_depth_luma, sps->bit_depth_chroma); |
416 | goto fail; |
417 | } |
418 | sps->transform_bypass = get_bits1(gb); |
419 | ret = decode_scaling_matrices(gb, sps, NULL, 1, |
420 | sps->scaling_matrix4, sps->scaling_matrix8); |
421 | if (ret < 0) |
422 | goto fail; |
423 | sps->scaling_matrix_present |= ret; |
424 | } else { |
425 | sps->chroma_format_idc = 1; |
426 | sps->bit_depth_luma = 8; |
427 | sps->bit_depth_chroma = 8; |
428 | } |
429 | |
430 | log2_max_frame_num_minus4 = get_ue_golomb(gb); |
431 | if (log2_max_frame_num_minus4 < MIN_LOG2_MAX_FRAME_NUM - 4 || |
432 | log2_max_frame_num_minus4 > MAX_LOG2_MAX_FRAME_NUM - 4) { |
433 | av_log(avctx, AV_LOG_ERROR, |
434 | "log2_max_frame_num_minus4 out of range (0-12): %d\n", |
435 | log2_max_frame_num_minus4); |
436 | goto fail; |
437 | } |
438 | sps->log2_max_frame_num = log2_max_frame_num_minus4 + 4; |
439 | |
440 | sps->poc_type = get_ue_golomb_31(gb); |
441 | |
442 | if (sps->poc_type == 0) { // FIXME #define |
443 | unsigned t = get_ue_golomb(gb); |
444 | if (t>12) { |
445 | av_log(avctx, AV_LOG_ERROR, "log2_max_poc_lsb (%d) is out of range\n", t); |
446 | goto fail; |
447 | } |
448 | sps->log2_max_poc_lsb = t + 4; |
449 | } else if (sps->poc_type == 1) { // FIXME #define |
450 | sps->delta_pic_order_always_zero_flag = get_bits1(gb); |
451 | sps->offset_for_non_ref_pic = get_se_golomb(gb); |
452 | sps->offset_for_top_to_bottom_field = get_se_golomb(gb); |
453 | sps->poc_cycle_length = get_ue_golomb(gb); |
454 | |
455 | if ((unsigned)sps->poc_cycle_length >= |
456 | FF_ARRAY_ELEMS(sps->offset_for_ref_frame)) { |
457 | av_log(avctx, AV_LOG_ERROR, |
458 | "poc_cycle_length overflow %d\n", sps->poc_cycle_length); |
459 | goto fail; |
460 | } |
461 | |
462 | for (i = 0; i < sps->poc_cycle_length; i++) |
463 | sps->offset_for_ref_frame[i] = get_se_golomb(gb); |
464 | } else if (sps->poc_type != 2) { |
465 | av_log(avctx, AV_LOG_ERROR, "illegal POC type %d\n", sps->poc_type); |
466 | goto fail; |
467 | } |
468 | |
469 | sps->ref_frame_count = get_ue_golomb_31(gb); |
470 | if (avctx->codec_tag == MKTAG('S', 'M', 'V', '2')) |
471 | sps->ref_frame_count = FFMAX(2, sps->ref_frame_count); |
472 | if (sps->ref_frame_count > MAX_DELAYED_PIC_COUNT) { |
473 | av_log(avctx, AV_LOG_ERROR, |
474 | "too many reference frames %d\n", sps->ref_frame_count); |
475 | goto fail; |
476 | } |
477 | sps->gaps_in_frame_num_allowed_flag = get_bits1(gb); |
478 | sps->mb_width = get_ue_golomb(gb) + 1; |
479 | sps->mb_height = get_ue_golomb(gb) + 1; |
480 | |
481 | sps->frame_mbs_only_flag = get_bits1(gb); |
482 | |
483 | if (sps->mb_height >= INT_MAX / 2U) { |
484 | av_log(avctx, AV_LOG_ERROR, "height overflow\n"); |
485 | goto fail; |
486 | } |
487 | sps->mb_height *= 2 - sps->frame_mbs_only_flag; |
488 | |
489 | if (!sps->frame_mbs_only_flag) |
490 | sps->mb_aff = get_bits1(gb); |
491 | else |
492 | sps->mb_aff = 0; |
493 | |
494 | if ((unsigned)sps->mb_width >= INT_MAX / 16 || |
495 | (unsigned)sps->mb_height >= INT_MAX / 16 || |
496 | av_image_check_size(16 * sps->mb_width, |
497 | 16 * sps->mb_height, 0, avctx)) { |
498 | av_log(avctx, AV_LOG_ERROR, "mb_width/height overflow\n"); |
499 | goto fail; |
500 | } |
501 | |
502 | sps->direct_8x8_inference_flag = get_bits1(gb); |
503 | |
504 | #ifndef ALLOW_INTERLACE |
505 | if (sps->mb_aff) |
506 | av_log(avctx, AV_LOG_ERROR, |
507 | "MBAFF support not included; enable it at compile-time.\n"); |
508 | #endif |
509 | sps->crop = get_bits1(gb); |
510 | if (sps->crop) { |
511 | unsigned int crop_left = get_ue_golomb(gb); |
512 | unsigned int crop_right = get_ue_golomb(gb); |
513 | unsigned int crop_top = get_ue_golomb(gb); |
514 | unsigned int crop_bottom = get_ue_golomb(gb); |
515 | int width = 16 * sps->mb_width; |
516 | int height = 16 * sps->mb_height; |
517 | |
518 | if (avctx->flags2 & AV_CODEC_FLAG2_IGNORE_CROP) { |
519 | av_log(avctx, AV_LOG_DEBUG, "discarding sps cropping, original " |
520 | "values are l:%d r:%d t:%d b:%d\n", |
521 | crop_left, crop_right, crop_top, crop_bottom); |
522 | |
523 | sps->crop_left = |
524 | sps->crop_right = |
525 | sps->crop_top = |
526 | sps->crop_bottom = 0; |
527 | } else { |
528 | int vsub = (sps->chroma_format_idc == 1) ? 1 : 0; |
529 | int hsub = (sps->chroma_format_idc == 1 || |
530 | sps->chroma_format_idc == 2) ? 1 : 0; |
531 | int step_x = 1 << hsub; |
532 | int step_y = (2 - sps->frame_mbs_only_flag) << vsub; |
533 | |
534 | if (crop_left & (0x1F >> (sps->bit_depth_luma > 8)) && |
535 | !(avctx->flags & AV_CODEC_FLAG_UNALIGNED)) { |
536 | crop_left &= ~(0x1F >> (sps->bit_depth_luma > 8)); |
537 | av_log(avctx, AV_LOG_WARNING, |
538 | "Reducing left cropping to %d " |
539 | "chroma samples to preserve alignment.\n", |
540 | crop_left); |
541 | } |
542 | |
543 | if (crop_left > (unsigned)INT_MAX / 4 / step_x || |
544 | crop_right > (unsigned)INT_MAX / 4 / step_x || |
545 | crop_top > (unsigned)INT_MAX / 4 / step_y || |
546 | crop_bottom> (unsigned)INT_MAX / 4 / step_y || |
547 | (crop_left + crop_right ) * step_x >= width || |
548 | (crop_top + crop_bottom) * step_y >= height |
549 | ) { |
550 | av_log(avctx, AV_LOG_ERROR, "crop values invalid %d %d %d %d / %d %d\n", crop_left, crop_right, crop_top, crop_bottom, width, height); |
551 | goto fail; |
552 | } |
553 | |
554 | sps->crop_left = crop_left * step_x; |
555 | sps->crop_right = crop_right * step_x; |
556 | sps->crop_top = crop_top * step_y; |
557 | sps->crop_bottom = crop_bottom * step_y; |
558 | } |
559 | } else { |
560 | sps->crop_left = |
561 | sps->crop_right = |
562 | sps->crop_top = |
563 | sps->crop_bottom = |
564 | sps->crop = 0; |
565 | } |
566 | |
567 | sps->vui_parameters_present_flag = get_bits1(gb); |
568 | if (sps->vui_parameters_present_flag) { |
569 | int ret = decode_vui_parameters(gb, avctx, sps); |
570 | if (ret < 0) |
571 | goto fail; |
572 | } |
573 | |
574 | if (get_bits_left(gb) < 0) { |
575 | av_log(avctx, ignore_truncation ? AV_LOG_WARNING : AV_LOG_ERROR, |
576 | "Overread %s by %d bits\n", sps->vui_parameters_present_flag ? "VUI" : "SPS", -get_bits_left(gb)); |
577 | if (!ignore_truncation) |
578 | goto fail; |
579 | } |
580 | |
581 | /* if the maximum delay is not stored in the SPS, derive it based on the |
582 | * level */ |
583 | if (!sps->bitstream_restriction_flag && |
584 | (sps->ref_frame_count || avctx->strict_std_compliance >= FF_COMPLIANCE_STRICT)) { |
585 | sps->num_reorder_frames = MAX_DELAYED_PIC_COUNT - 1; |
586 | for (i = 0; i < FF_ARRAY_ELEMS(level_max_dpb_mbs); i++) { |
587 | if (level_max_dpb_mbs[i][0] == sps->level_idc) { |
588 | sps->num_reorder_frames = FFMIN(level_max_dpb_mbs[i][1] / (sps->mb_width * sps->mb_height), |
589 | sps->num_reorder_frames); |
590 | break; |
591 | } |
592 | } |
593 | } |
594 | |
595 | if (!sps->sar.den) |
596 | sps->sar.den = 1; |
597 | |
598 | if (avctx->debug & FF_DEBUG_PICT_INFO) { |
599 | static const char csp[4][5] = { "Gray", "420", "422", "444" }; |
600 | av_log(avctx, AV_LOG_DEBUG, |
601 | "sps:%u profile:%d/%d poc:%d ref:%d %dx%d %s %s crop:%u/%u/%u/%u %s %s %"PRId32"/%"PRId32" b%d reo:%d\n", |
602 | sps_id, sps->profile_idc, sps->level_idc, |
603 | sps->poc_type, |
604 | sps->ref_frame_count, |
605 | sps->mb_width, sps->mb_height, |
606 | sps->frame_mbs_only_flag ? "FRM" : (sps->mb_aff ? "MB-AFF" : "PIC-AFF"), |
607 | sps->direct_8x8_inference_flag ? "8B8" : "", |
608 | sps->crop_left, sps->crop_right, |
609 | sps->crop_top, sps->crop_bottom, |
610 | sps->vui_parameters_present_flag ? "VUI" : "", |
611 | csp[sps->chroma_format_idc], |
612 | sps->timing_info_present_flag ? sps->num_units_in_tick : 0, |
613 | sps->timing_info_present_flag ? sps->time_scale : 0, |
614 | sps->bit_depth_luma, |
615 | sps->bitstream_restriction_flag ? sps->num_reorder_frames : -1 |
616 | ); |
617 | } |
618 | |
619 | /* check if this is a repeat of an already parsed SPS, then keep the |
620 | * original one. |
621 | * otherwise drop all PPSes that depend on it */ |
622 | if (ps->sps_list[sps_id] && |
623 | !memcmp(ps->sps_list[sps_id]->data, sps_buf->data, sps_buf->size)) { |
624 | av_buffer_unref(&sps_buf); |
625 | } else { |
626 | remove_sps(ps, sps_id); |
627 | ps->sps_list[sps_id] = sps_buf; |
628 | } |
629 | |
630 | return 0; |
631 | |
632 | fail: |
633 | av_buffer_unref(&sps_buf); |
634 | return AVERROR_INVALIDDATA; |
635 | } |
636 | |
637 | static void init_dequant8_coeff_table(PPS *pps, const SPS *sps) |
638 | { |
639 | int i, j, q, x; |
640 | const int max_qp = 51 + 6 * (sps->bit_depth_luma - 8); |
641 | |
642 | for (i = 0; i < 6; i++) { |
643 | pps->dequant8_coeff[i] = pps->dequant8_buffer[i]; |
644 | for (j = 0; j < i; j++) |
645 | if (!memcmp(pps->scaling_matrix8[j], pps->scaling_matrix8[i], |
646 | 64 * sizeof(uint8_t))) { |
647 | pps->dequant8_coeff[i] = pps->dequant8_buffer[j]; |
648 | break; |
649 | } |
650 | if (j < i) |
651 | continue; |
652 | |
653 | for (q = 0; q < max_qp + 1; q++) { |
654 | int shift = ff_h264_quant_div6[q]; |
655 | int idx = ff_h264_quant_rem6[q]; |
656 | for (x = 0; x < 64; x++) |
657 | pps->dequant8_coeff[i][q][(x >> 3) | ((x & 7) << 3)] = |
658 | ((uint32_t)ff_h264_dequant8_coeff_init[idx][ff_h264_dequant8_coeff_init_scan[((x >> 1) & 12) | (x & 3)]] * |
659 | pps->scaling_matrix8[i][x]) << shift; |
660 | } |
661 | } |
662 | } |
663 | |
664 | static void init_dequant4_coeff_table(PPS *pps, const SPS *sps) |
665 | { |
666 | int i, j, q, x; |
667 | const int max_qp = 51 + 6 * (sps->bit_depth_luma - 8); |
668 | for (i = 0; i < 6; i++) { |
669 | pps->dequant4_coeff[i] = pps->dequant4_buffer[i]; |
670 | for (j = 0; j < i; j++) |
671 | if (!memcmp(pps->scaling_matrix4[j], pps->scaling_matrix4[i], |
672 | 16 * sizeof(uint8_t))) { |
673 | pps->dequant4_coeff[i] = pps->dequant4_buffer[j]; |
674 | break; |
675 | } |
676 | if (j < i) |
677 | continue; |
678 | |
679 | for (q = 0; q < max_qp + 1; q++) { |
680 | int shift = ff_h264_quant_div6[q] + 2; |
681 | int idx = ff_h264_quant_rem6[q]; |
682 | for (x = 0; x < 16; x++) |
683 | pps->dequant4_coeff[i][q][(x >> 2) | ((x << 2) & 0xF)] = |
684 | ((uint32_t)ff_h264_dequant4_coeff_init[idx][(x & 1) + ((x >> 2) & 1)] * |
685 | pps->scaling_matrix4[i][x]) << shift; |
686 | } |
687 | } |
688 | } |
689 | |
690 | static void init_dequant_tables(PPS *pps, const SPS *sps) |
691 | { |
692 | int i, x; |
693 | init_dequant4_coeff_table(pps, sps); |
694 | memset(pps->dequant8_coeff, 0, sizeof(pps->dequant8_coeff)); |
695 | |
696 | if (pps->transform_8x8_mode) |
697 | init_dequant8_coeff_table(pps, sps); |
698 | if (sps->transform_bypass) { |
699 | for (i = 0; i < 6; i++) |
700 | for (x = 0; x < 16; x++) |
701 | pps->dequant4_coeff[i][0][x] = 1 << 6; |
702 | if (pps->transform_8x8_mode) |
703 | for (i = 0; i < 6; i++) |
704 | for (x = 0; x < 64; x++) |
705 | pps->dequant8_coeff[i][0][x] = 1 << 6; |
706 | } |
707 | } |
708 | |
709 | static void build_qp_table(PPS *pps, int t, int index, const int depth) |
710 | { |
711 | int i; |
712 | const int max_qp = 51 + 6 * (depth - 8); |
713 | for (i = 0; i < max_qp + 1; i++) |
714 | pps->chroma_qp_table[t][i] = |
715 | ff_h264_chroma_qp[depth - 8][av_clip(i + index, 0, max_qp)]; |
716 | } |
717 | |
718 | static int more_rbsp_data_in_pps(const SPS *sps, void *logctx) |
719 | { |
720 | int profile_idc = sps->profile_idc; |
721 | |
722 | if ((profile_idc == 66 || profile_idc == 77 || |
723 | profile_idc == 88) && (sps->constraint_set_flags & 7)) { |
724 | av_log(logctx, AV_LOG_VERBOSE, |
725 | "Current profile doesn't provide more RBSP data in PPS, skipping\n"); |
726 | return 0; |
727 | } |
728 | |
729 | return 1; |
730 | } |
731 | |
732 | int ff_h264_decode_picture_parameter_set(GetBitContext *gb, AVCodecContext *avctx, |
733 | H264ParamSets *ps, int bit_length) |
734 | { |
735 | AVBufferRef *pps_buf; |
736 | const SPS *sps; |
737 | unsigned int pps_id = get_ue_golomb(gb); |
738 | PPS *pps; |
739 | int qp_bd_offset; |
740 | int bits_left; |
741 | int ret; |
742 | |
743 | if (pps_id >= MAX_PPS_COUNT) { |
744 | av_log(avctx, AV_LOG_ERROR, "pps_id %u out of range\n", pps_id); |
745 | return AVERROR_INVALIDDATA; |
746 | } |
747 | |
748 | pps_buf = av_buffer_allocz(sizeof(*pps)); |
749 | if (!pps_buf) |
750 | return AVERROR(ENOMEM); |
751 | pps = (PPS*)pps_buf->data; |
752 | |
753 | pps->data_size = gb->buffer_end - gb->buffer; |
754 | if (pps->data_size > sizeof(pps->data)) { |
755 | av_log(avctx, AV_LOG_WARNING, "Truncating likely oversized PPS " |
756 | "(%"SIZE_SPECIFIER" > %"SIZE_SPECIFIER")\n", |
757 | pps->data_size, sizeof(pps->data)); |
758 | pps->data_size = sizeof(pps->data); |
759 | } |
760 | memcpy(pps->data, gb->buffer, pps->data_size); |
761 | |
762 | pps->sps_id = get_ue_golomb_31(gb); |
763 | if ((unsigned)pps->sps_id >= MAX_SPS_COUNT || |
764 | !ps->sps_list[pps->sps_id]) { |
765 | av_log(avctx, AV_LOG_ERROR, "sps_id %u out of range\n", pps->sps_id); |
766 | ret = AVERROR_INVALIDDATA; |
767 | goto fail; |
768 | } |
769 | sps = (const SPS*)ps->sps_list[pps->sps_id]->data; |
770 | if (sps->bit_depth_luma > 14) { |
771 | av_log(avctx, AV_LOG_ERROR, |
772 | "Invalid luma bit depth=%d\n", |
773 | sps->bit_depth_luma); |
774 | ret = AVERROR_INVALIDDATA; |
775 | goto fail; |
776 | } else if (sps->bit_depth_luma == 11 || sps->bit_depth_luma == 13) { |
777 | avpriv_report_missing_feature(avctx, |
778 | "Unimplemented luma bit depth=%d", |
779 | sps->bit_depth_luma); |
780 | ret = AVERROR_PATCHWELCOME; |
781 | goto fail; |
782 | } |
783 | |
784 | pps->cabac = get_bits1(gb); |
785 | pps->pic_order_present = get_bits1(gb); |
786 | pps->slice_group_count = get_ue_golomb(gb) + 1; |
787 | if (pps->slice_group_count > 1) { |
788 | pps->mb_slice_group_map_type = get_ue_golomb(gb); |
789 | av_log(avctx, AV_LOG_ERROR, "FMO not supported\n"); |
790 | } |
791 | pps->ref_count[0] = get_ue_golomb(gb) + 1; |
792 | pps->ref_count[1] = get_ue_golomb(gb) + 1; |
793 | if (pps->ref_count[0] - 1 > 32 - 1 || pps->ref_count[1] - 1 > 32 - 1) { |
794 | av_log(avctx, AV_LOG_ERROR, "reference overflow (pps)\n"); |
795 | ret = AVERROR_INVALIDDATA; |
796 | goto fail; |
797 | } |
798 | |
799 | qp_bd_offset = 6 * (sps->bit_depth_luma - 8); |
800 | |
801 | pps->weighted_pred = get_bits1(gb); |
802 | pps->weighted_bipred_idc = get_bits(gb, 2); |
803 | pps->init_qp = get_se_golomb(gb) + 26U + qp_bd_offset; |
804 | pps->init_qs = get_se_golomb(gb) + 26U + qp_bd_offset; |
805 | pps->chroma_qp_index_offset[0] = get_se_golomb(gb); |
806 | if (pps->chroma_qp_index_offset[0] < -12 || pps->chroma_qp_index_offset[0] > 12) { |
807 | ret = AVERROR_INVALIDDATA; |
808 | goto fail; |
809 | } |
810 | |
811 | pps->deblocking_filter_parameters_present = get_bits1(gb); |
812 | pps->constrained_intra_pred = get_bits1(gb); |
813 | pps->redundant_pic_cnt_present = get_bits1(gb); |
814 | |
815 | pps->transform_8x8_mode = 0; |
816 | memcpy(pps->scaling_matrix4, sps->scaling_matrix4, |
817 | sizeof(pps->scaling_matrix4)); |
818 | memcpy(pps->scaling_matrix8, sps->scaling_matrix8, |
819 | sizeof(pps->scaling_matrix8)); |
820 | |
821 | bits_left = bit_length - get_bits_count(gb); |
822 | if (bits_left > 0 && more_rbsp_data_in_pps(sps, avctx)) { |
823 | pps->transform_8x8_mode = get_bits1(gb); |
824 | ret = decode_scaling_matrices(gb, sps, pps, 0, |
825 | pps->scaling_matrix4, pps->scaling_matrix8); |
826 | if (ret < 0) |
827 | goto fail; |
828 | // second_chroma_qp_index_offset |
829 | pps->chroma_qp_index_offset[1] = get_se_golomb(gb); |
830 | if (pps->chroma_qp_index_offset[1] < -12 || pps->chroma_qp_index_offset[1] > 12) { |
831 | ret = AVERROR_INVALIDDATA; |
832 | goto fail; |
833 | } |
834 | } else { |
835 | pps->chroma_qp_index_offset[1] = pps->chroma_qp_index_offset[0]; |
836 | } |
837 | |
838 | build_qp_table(pps, 0, pps->chroma_qp_index_offset[0], |
839 | sps->bit_depth_luma); |
840 | build_qp_table(pps, 1, pps->chroma_qp_index_offset[1], |
841 | sps->bit_depth_luma); |
842 | |
843 | init_dequant_tables(pps, sps); |
844 | |
845 | if (pps->chroma_qp_index_offset[0] != pps->chroma_qp_index_offset[1]) |
846 | pps->chroma_qp_diff = 1; |
847 | |
848 | if (avctx->debug & FF_DEBUG_PICT_INFO) { |
849 | av_log(avctx, AV_LOG_DEBUG, |
850 | "pps:%u sps:%u %s slice_groups:%d ref:%u/%u %s qp:%d/%d/%d/%d %s %s %s %s\n", |
851 | pps_id, pps->sps_id, |
852 | pps->cabac ? "CABAC" : "CAVLC", |
853 | pps->slice_group_count, |
854 | pps->ref_count[0], pps->ref_count[1], |
855 | pps->weighted_pred ? "weighted" : "", |
856 | pps->init_qp, pps->init_qs, pps->chroma_qp_index_offset[0], pps->chroma_qp_index_offset[1], |
857 | pps->deblocking_filter_parameters_present ? "LPAR" : "", |
858 | pps->constrained_intra_pred ? "CONSTR" : "", |
859 | pps->redundant_pic_cnt_present ? "REDU" : "", |
860 | pps->transform_8x8_mode ? "8x8DCT" : ""); |
861 | } |
862 | |
863 | remove_pps(ps, pps_id); |
864 | ps->pps_list[pps_id] = pps_buf; |
865 | |
866 | return 0; |
867 | |
868 | fail: |
869 | av_buffer_unref(&pps_buf); |
870 | return ret; |
871 | } |
872 |