avformat/mpeg: demux ivtv captions
[ffmpeg.git] / libavcodec / h264_parse.c
blobc6f9b3cea753be766ae753cee2817ad6ff9d19a9
1 /*
2 * This file is part of FFmpeg.
4 * FFmpeg is free software; you can redistribute it and/or
5 * modify it under the terms of the GNU Lesser General Public
6 * License as published by the Free Software Foundation; either
7 * version 2.1 of the License, or (at your option) any later version.
9 * FFmpeg is distributed in the hope that it will be useful,
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
12 * Lesser General Public License for more details.
14 * You should have received a copy of the GNU Lesser General Public
15 * License along with FFmpeg; if not, write to the Free Software
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19 #include "libavutil/mem.h"
20 #include "bytestream.h"
21 #include "get_bits.h"
22 #include "golomb.h"
23 #include "h264.h"
24 #include "h264pred.h"
25 #include "h264_parse.h"
26 #include "h264_ps.h"
27 #include "h2645_parse.h"
28 #include "mpegutils.h"
30 int ff_h264_pred_weight_table(GetBitContext *gb, const SPS *sps,
31 const int *ref_count, int slice_type_nos,
32 H264PredWeightTable *pwt,
33 int picture_structure, void *logctx)
35 int list, i, j;
36 int luma_def, chroma_def;
38 pwt->use_weight = 0;
39 pwt->use_weight_chroma = 0;
41 pwt->luma_log2_weight_denom = get_ue_golomb_31(gb);
42 if (pwt->luma_log2_weight_denom > 7U) {
43 av_log(logctx, AV_LOG_ERROR, "luma_log2_weight_denom %d is out of range\n", pwt->luma_log2_weight_denom);
44 pwt->luma_log2_weight_denom = 0;
46 luma_def = 1 << pwt->luma_log2_weight_denom;
48 if (sps->chroma_format_idc) {
49 pwt->chroma_log2_weight_denom = get_ue_golomb_31(gb);
50 if (pwt->chroma_log2_weight_denom > 7U) {
51 av_log(logctx, AV_LOG_ERROR, "chroma_log2_weight_denom %d is out of range\n", pwt->chroma_log2_weight_denom);
52 pwt->chroma_log2_weight_denom = 0;
54 chroma_def = 1 << pwt->chroma_log2_weight_denom;
57 for (list = 0; list < 2; list++) {
58 pwt->luma_weight_flag[list] = 0;
59 pwt->chroma_weight_flag[list] = 0;
60 for (i = 0; i < ref_count[list]; i++) {
61 int luma_weight_flag, chroma_weight_flag;
63 luma_weight_flag = get_bits1(gb);
64 if (luma_weight_flag) {
65 pwt->luma_weight[i][list][0] = get_se_golomb(gb);
66 pwt->luma_weight[i][list][1] = get_se_golomb(gb);
67 if ((int8_t)pwt->luma_weight[i][list][0] != pwt->luma_weight[i][list][0] ||
68 (int8_t)pwt->luma_weight[i][list][1] != pwt->luma_weight[i][list][1])
69 goto out_range_weight;
70 if (pwt->luma_weight[i][list][0] != luma_def ||
71 pwt->luma_weight[i][list][1] != 0) {
72 pwt->use_weight = 1;
73 pwt->luma_weight_flag[list] = 1;
75 } else {
76 pwt->luma_weight[i][list][0] = luma_def;
77 pwt->luma_weight[i][list][1] = 0;
80 if (sps->chroma_format_idc) {
81 chroma_weight_flag = get_bits1(gb);
82 if (chroma_weight_flag) {
83 int j;
84 for (j = 0; j < 2; j++) {
85 pwt->chroma_weight[i][list][j][0] = get_se_golomb(gb);
86 pwt->chroma_weight[i][list][j][1] = get_se_golomb(gb);
87 if ((int8_t)pwt->chroma_weight[i][list][j][0] != pwt->chroma_weight[i][list][j][0] ||
88 (int8_t)pwt->chroma_weight[i][list][j][1] != pwt->chroma_weight[i][list][j][1]) {
89 pwt->chroma_weight[i][list][j][0] = chroma_def;
90 pwt->chroma_weight[i][list][j][1] = 0;
91 goto out_range_weight;
93 if (pwt->chroma_weight[i][list][j][0] != chroma_def ||
94 pwt->chroma_weight[i][list][j][1] != 0) {
95 pwt->use_weight_chroma = 1;
96 pwt->chroma_weight_flag[list] = 1;
99 } else {
100 int j;
101 for (j = 0; j < 2; j++) {
102 pwt->chroma_weight[i][list][j][0] = chroma_def;
103 pwt->chroma_weight[i][list][j][1] = 0;
108 // for MBAFF
109 if (picture_structure == PICT_FRAME) {
110 pwt->luma_weight[16 + 2 * i][list][0] = pwt->luma_weight[16 + 2 * i + 1][list][0] = pwt->luma_weight[i][list][0];
111 pwt->luma_weight[16 + 2 * i][list][1] = pwt->luma_weight[16 + 2 * i + 1][list][1] = pwt->luma_weight[i][list][1];
112 if (sps->chroma_format_idc) {
113 for (j = 0; j < 2; j++) {
114 pwt->chroma_weight[16 + 2 * i][list][j][0] = pwt->chroma_weight[16 + 2 * i + 1][list][j][0] = pwt->chroma_weight[i][list][j][0];
115 pwt->chroma_weight[16 + 2 * i][list][j][1] = pwt->chroma_weight[16 + 2 * i + 1][list][j][1] = pwt->chroma_weight[i][list][j][1];
120 if (slice_type_nos != AV_PICTURE_TYPE_B)
121 break;
123 pwt->use_weight = pwt->use_weight || pwt->use_weight_chroma;
124 return 0;
125 out_range_weight:
126 avpriv_request_sample(logctx, "Out of range weight");
127 return AVERROR_INVALIDDATA;
131 * Check if the top & left blocks are available if needed and
132 * change the dc mode so it only uses the available blocks.
134 int ff_h264_check_intra4x4_pred_mode(int8_t *pred_mode_cache, void *logctx,
135 int top_samples_available, int left_samples_available)
137 static const int8_t top[12] = {
138 -1, 0, LEFT_DC_PRED, -1, -1, -1, -1, -1, 0
140 static const int8_t left[12] = {
141 0, -1, TOP_DC_PRED, 0, -1, -1, -1, 0, -1, DC_128_PRED
143 int i;
145 if (!(top_samples_available & 0x8000)) {
146 for (i = 0; i < 4; i++) {
147 int status = top[pred_mode_cache[scan8[0] + i]];
148 if (status < 0) {
149 av_log(logctx, AV_LOG_ERROR,
150 "top block unavailable for requested intra mode %d\n",
151 status);
152 return AVERROR_INVALIDDATA;
153 } else if (status) {
154 pred_mode_cache[scan8[0] + i] = status;
159 if ((left_samples_available & 0x8888) != 0x8888) {
160 static const int mask[4] = { 0x8000, 0x2000, 0x80, 0x20 };
161 for (i = 0; i < 4; i++)
162 if (!(left_samples_available & mask[i])) {
163 int status = left[pred_mode_cache[scan8[0] + 8 * i]];
164 if (status < 0) {
165 av_log(logctx, AV_LOG_ERROR,
166 "left block unavailable for requested intra4x4 mode %d\n",
167 status);
168 return AVERROR_INVALIDDATA;
169 } else if (status) {
170 pred_mode_cache[scan8[0] + 8 * i] = status;
175 return 0;
179 * Check if the top & left blocks are available if needed and
180 * change the dc mode so it only uses the available blocks.
182 int ff_h264_check_intra_pred_mode(void *logctx, int top_samples_available,
183 int left_samples_available,
184 int mode, int is_chroma)
186 static const int8_t top[4] = { LEFT_DC_PRED8x8, 1, -1, -1 };
187 static const int8_t left[5] = { TOP_DC_PRED8x8, -1, 2, -1, DC_128_PRED8x8 };
189 if (mode > 3U) {
190 av_log(logctx, AV_LOG_ERROR,
191 "out of range intra chroma pred mode\n");
192 return AVERROR_INVALIDDATA;
195 if (!(top_samples_available & 0x8000)) {
196 mode = top[mode];
197 if (mode < 0) {
198 av_log(logctx, AV_LOG_ERROR,
199 "top block unavailable for requested intra mode\n");
200 return AVERROR_INVALIDDATA;
204 if ((left_samples_available & 0x8080) != 0x8080) {
205 mode = left[mode];
206 if (mode < 0) {
207 av_log(logctx, AV_LOG_ERROR,
208 "left block unavailable for requested intra mode\n");
209 return AVERROR_INVALIDDATA;
211 if (is_chroma && (left_samples_available & 0x8080)) {
212 // mad cow disease mode, aka MBAFF + constrained_intra_pred
213 mode = ALZHEIMER_DC_L0T_PRED8x8 +
214 (!(left_samples_available & 0x8000)) +
215 2 * (mode == DC_128_PRED8x8);
219 return mode;
222 int ff_h264_parse_ref_count(int *plist_count, int ref_count[2],
223 GetBitContext *gb, const PPS *pps,
224 int slice_type_nos, int picture_structure, void *logctx)
226 int list_count;
227 int num_ref_idx_active_override_flag;
229 // set defaults, might be overridden a few lines later
230 ref_count[0] = pps->ref_count[0];
231 ref_count[1] = pps->ref_count[1];
233 if (slice_type_nos != AV_PICTURE_TYPE_I) {
234 unsigned max[2];
235 max[0] = max[1] = picture_structure == PICT_FRAME ? 15 : 31;
237 num_ref_idx_active_override_flag = get_bits1(gb);
239 if (num_ref_idx_active_override_flag) {
240 ref_count[0] = get_ue_golomb(gb) + 1;
241 if (slice_type_nos == AV_PICTURE_TYPE_B) {
242 ref_count[1] = get_ue_golomb(gb) + 1;
243 } else
244 // full range is spec-ok in this case, even for frames
245 ref_count[1] = 1;
248 if (slice_type_nos == AV_PICTURE_TYPE_B)
249 list_count = 2;
250 else
251 list_count = 1;
253 if (ref_count[0] - 1 > max[0] || (list_count == 2 && (ref_count[1] - 1 > max[1]))) {
254 av_log(logctx, AV_LOG_ERROR, "reference overflow %u > %u or %u > %u\n",
255 ref_count[0] - 1, max[0], ref_count[1] - 1, max[1]);
256 ref_count[0] = ref_count[1] = 0;
257 *plist_count = 0;
258 goto fail;
259 } else if (ref_count[1] - 1 > max[1]) {
260 av_log(logctx, AV_LOG_DEBUG, "reference overflow %u > %u \n",
261 ref_count[1] - 1, max[1]);
262 ref_count[1] = 0;
265 } else {
266 list_count = 0;
267 ref_count[0] = ref_count[1] = 0;
270 *plist_count = list_count;
272 return 0;
273 fail:
274 *plist_count = 0;
275 ref_count[0] = 0;
276 ref_count[1] = 0;
277 return AVERROR_INVALIDDATA;
280 int ff_h264_init_poc(int pic_field_poc[2], int *pic_poc,
281 const SPS *sps, H264POCContext *pc,
282 int picture_structure, int nal_ref_idc)
284 const int max_frame_num = 1 << sps->log2_max_frame_num;
285 int64_t field_poc[2];
287 pc->frame_num_offset = pc->prev_frame_num_offset;
288 if (pc->frame_num < pc->prev_frame_num)
289 pc->frame_num_offset += max_frame_num;
291 if (sps->poc_type == 0) {
292 const int max_poc_lsb = 1 << sps->log2_max_poc_lsb;
293 if (pc->prev_poc_lsb < 0)
294 pc->prev_poc_lsb = pc->poc_lsb;
296 if (pc->poc_lsb < pc->prev_poc_lsb &&
297 pc->prev_poc_lsb - pc->poc_lsb >= max_poc_lsb / 2)
298 pc->poc_msb = pc->prev_poc_msb + max_poc_lsb;
299 else if (pc->poc_lsb > pc->prev_poc_lsb &&
300 pc->prev_poc_lsb - pc->poc_lsb < -max_poc_lsb / 2)
301 pc->poc_msb = pc->prev_poc_msb - max_poc_lsb;
302 else
303 pc->poc_msb = pc->prev_poc_msb;
304 field_poc[0] =
305 field_poc[1] = pc->poc_msb + pc->poc_lsb;
306 if (picture_structure == PICT_FRAME)
307 field_poc[1] += pc->delta_poc_bottom;
308 } else if (sps->poc_type == 1) {
309 int abs_frame_num;
310 int64_t expected_delta_per_poc_cycle, expectedpoc;
311 int i;
313 if (sps->poc_cycle_length != 0)
314 abs_frame_num = pc->frame_num_offset + pc->frame_num;
315 else
316 abs_frame_num = 0;
318 if (nal_ref_idc == 0 && abs_frame_num > 0)
319 abs_frame_num--;
321 expected_delta_per_poc_cycle = 0;
322 for (i = 0; i < sps->poc_cycle_length; i++)
323 // FIXME integrate during sps parse
324 expected_delta_per_poc_cycle += sps->offset_for_ref_frame[i];
326 if (abs_frame_num > 0) {
327 int poc_cycle_cnt = (abs_frame_num - 1) / sps->poc_cycle_length;
328 int frame_num_in_poc_cycle = (abs_frame_num - 1) % sps->poc_cycle_length;
330 expectedpoc = poc_cycle_cnt * expected_delta_per_poc_cycle;
331 for (i = 0; i <= frame_num_in_poc_cycle; i++)
332 expectedpoc = expectedpoc + sps->offset_for_ref_frame[i];
333 } else
334 expectedpoc = 0;
336 if (nal_ref_idc == 0)
337 expectedpoc = expectedpoc + sps->offset_for_non_ref_pic;
339 field_poc[0] = expectedpoc + pc->delta_poc[0];
340 field_poc[1] = field_poc[0] + sps->offset_for_top_to_bottom_field;
342 if (picture_structure == PICT_FRAME)
343 field_poc[1] += pc->delta_poc[1];
344 } else {
345 int poc = 2 * (pc->frame_num_offset + pc->frame_num);
347 if (!nal_ref_idc)
348 poc--;
350 field_poc[0] = poc;
351 field_poc[1] = poc;
354 if ( field_poc[0] != (int)field_poc[0]
355 || field_poc[1] != (int)field_poc[1])
356 return AVERROR_INVALIDDATA;
358 if (picture_structure != PICT_BOTTOM_FIELD)
359 pic_field_poc[0] = field_poc[0];
360 if (picture_structure != PICT_TOP_FIELD)
361 pic_field_poc[1] = field_poc[1];
362 *pic_poc = FFMIN(pic_field_poc[0], pic_field_poc[1]);
364 return 0;
367 static int decode_extradata_ps(const uint8_t *data, int size, H264ParamSets *ps,
368 int is_avc, void *logctx)
370 H2645Packet pkt = { 0 };
371 int flags = (H2645_FLAG_IS_NALFF * !!is_avc) | H2645_FLAG_SMALL_PADDING;
372 int i, ret = 0;
374 ret = ff_h2645_packet_split(&pkt, data, size, logctx, 2, AV_CODEC_ID_H264, flags);
375 if (ret < 0) {
376 ret = 0;
377 goto fail;
380 for (i = 0; i < pkt.nb_nals; i++) {
381 H2645NAL *nal = &pkt.nals[i];
382 switch (nal->type) {
383 case H264_NAL_SPS: {
384 GetBitContext tmp_gb = nal->gb;
385 ret = ff_h264_decode_seq_parameter_set(&tmp_gb, logctx, ps, 0);
386 if (ret >= 0)
387 break;
388 av_log(logctx, AV_LOG_DEBUG,
389 "SPS decoding failure, trying again with the complete NAL\n");
390 init_get_bits8(&tmp_gb, nal->raw_data + 1, nal->raw_size - 1);
391 ret = ff_h264_decode_seq_parameter_set(&tmp_gb, logctx, ps, 0);
392 if (ret >= 0)
393 break;
394 ret = ff_h264_decode_seq_parameter_set(&nal->gb, logctx, ps, 1);
395 if (ret < 0)
396 goto fail;
397 break;
399 case H264_NAL_PPS:
400 ret = ff_h264_decode_picture_parameter_set(&nal->gb, logctx, ps,
401 nal->size_bits);
402 if (ret < 0)
403 goto fail;
404 break;
405 default:
406 av_log(logctx, AV_LOG_VERBOSE, "Ignoring NAL type %d in extradata\n",
407 nal->type);
408 break;
412 fail:
413 ff_h2645_packet_uninit(&pkt);
414 return ret;
417 /* There are (invalid) samples in the wild with mp4-style extradata, where the
418 * parameter sets are stored unescaped (i.e. as RBSP).
419 * This function catches the parameter set decoding failure and tries again
420 * after escaping it */
421 static int decode_extradata_ps_mp4(const uint8_t *buf, int buf_size, H264ParamSets *ps,
422 int err_recognition, void *logctx)
424 int ret;
426 ret = decode_extradata_ps(buf, buf_size, ps, 1, logctx);
427 if (ret < 0 && !(err_recognition & AV_EF_EXPLODE)) {
428 GetByteContext gbc;
429 PutByteContext pbc;
430 uint8_t *escaped_buf;
431 int escaped_buf_size;
433 av_log(logctx, AV_LOG_WARNING,
434 "SPS decoding failure, trying again after escaping the NAL\n");
436 if (buf_size / 2 >= (INT16_MAX - AV_INPUT_BUFFER_PADDING_SIZE) / 3)
437 return AVERROR(ERANGE);
438 escaped_buf_size = buf_size * 3 / 2 + AV_INPUT_BUFFER_PADDING_SIZE;
439 escaped_buf = av_mallocz(escaped_buf_size);
440 if (!escaped_buf)
441 return AVERROR(ENOMEM);
443 bytestream2_init(&gbc, buf, buf_size);
444 bytestream2_init_writer(&pbc, escaped_buf, escaped_buf_size);
446 while (bytestream2_get_bytes_left(&gbc)) {
447 if (bytestream2_get_bytes_left(&gbc) >= 3 &&
448 bytestream2_peek_be24(&gbc) <= 3) {
449 bytestream2_put_be24(&pbc, 3);
450 bytestream2_skip(&gbc, 2);
451 } else
452 bytestream2_put_byte(&pbc, bytestream2_get_byte(&gbc));
455 escaped_buf_size = bytestream2_tell_p(&pbc);
456 AV_WB16(escaped_buf, escaped_buf_size - 2);
458 (void)decode_extradata_ps(escaped_buf, escaped_buf_size, ps, 1, logctx);
459 // lorex.mp4 decodes ok even with extradata decoding failing
460 av_freep(&escaped_buf);
463 return 0;
466 int ff_h264_decode_extradata(const uint8_t *data, int size, H264ParamSets *ps,
467 int *is_avc, int *nal_length_size,
468 int err_recognition, void *logctx)
470 int ret;
472 if (!data || size <= 0)
473 return AVERROR(EINVAL);
475 if (data[0] == 1) {
476 int i, cnt, nalsize;
477 const uint8_t *p = data;
479 *is_avc = 1;
481 if (size < 7) {
482 av_log(logctx, AV_LOG_ERROR, "avcC %d too short\n", size);
483 return AVERROR_INVALIDDATA;
486 // Decode sps from avcC
487 cnt = *(p + 5) & 0x1f; // Number of sps
488 p += 6;
489 for (i = 0; i < cnt; i++) {
490 nalsize = AV_RB16(p) + 2;
491 if (nalsize > size - (p - data))
492 return AVERROR_INVALIDDATA;
493 ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
494 if (ret < 0) {
495 av_log(logctx, AV_LOG_ERROR,
496 "Decoding sps %d from avcC failed\n", i);
497 return ret;
499 p += nalsize;
501 // Decode pps from avcC
502 cnt = *(p++); // Number of pps
503 for (i = 0; i < cnt; i++) {
504 nalsize = AV_RB16(p) + 2;
505 if (nalsize > size - (p - data))
506 return AVERROR_INVALIDDATA;
507 ret = decode_extradata_ps_mp4(p, nalsize, ps, err_recognition, logctx);
508 if (ret < 0) {
509 av_log(logctx, AV_LOG_ERROR,
510 "Decoding pps %d from avcC failed\n", i);
511 return ret;
513 p += nalsize;
515 // Store right nal length size that will be used to parse all other nals
516 *nal_length_size = (data[4] & 0x03) + 1;
517 } else {
518 *is_avc = 0;
519 ret = decode_extradata_ps(data, size, ps, 0, logctx);
520 if (ret < 0)
521 return ret;
523 return size;
527 * Compute profile from profile_idc and constraint_set?_flags.
529 * @param sps SPS
531 * @return profile as defined by AV_PROFILE_H264_*
533 int ff_h264_get_profile(const SPS *sps)
535 int profile = sps->profile_idc;
537 switch (sps->profile_idc) {
538 case AV_PROFILE_H264_BASELINE:
539 // constraint_set1_flag set to 1
540 profile |= (sps->constraint_set_flags & 1 << 1) ? AV_PROFILE_H264_CONSTRAINED : 0;
541 break;
542 case AV_PROFILE_H264_HIGH_10:
543 case AV_PROFILE_H264_HIGH_422:
544 case AV_PROFILE_H264_HIGH_444_PREDICTIVE:
545 // constraint_set3_flag set to 1
546 profile |= (sps->constraint_set_flags & 1 << 3) ? AV_PROFILE_H264_INTRA : 0;
547 break;
550 return profile;