FFmpeg
h264_parser.c
Go to the documentation of this file.
1 /*
2  * H.26L/H.264/AVC/JVT/14496-10/... parser
3  * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 /**
23  * @file
24  * H.264 / AVC / MPEG-4 part10 parser.
25  * @author Michael Niedermayer <michaelni@gmx.at>
26  */
27 
28 #define UNCHECKED_BITSTREAM_READER 1
29 
30 #include <stdint.h>
31 
32 #include "libavutil/attributes.h"
33 #include "libavutil/avutil.h"
34 #include "libavutil/error.h"
35 #include "libavutil/log.h"
36 #include "libavutil/mem.h"
37 #include "libavutil/pixfmt.h"
38 
39 #include "avcodec.h"
40 #include "get_bits.h"
41 #include "golomb.h"
42 #include "h264.h"
43 #include "h264dsp.h"
44 #include "h264_parse.h"
45 #include "h264_sei.h"
46 #include "h264_ps.h"
47 #include "h2645_parse.h"
48 #include "h264data.h"
49 #include "mpegutils.h"
50 #include "parser.h"
51 #include "libavutil/refstruct.h"
52 #include "startcode.h"
53 
54 typedef struct H264ParseContext {
60  int is_avc;
62  int got_first;
64  uint8_t parse_history[6];
70 
71 static int find_start_code(const uint8_t *buf, int buf_size,
72  int buf_index, int next_avc)
73 {
74  uint32_t state = -1;
75 
76  buf_index = avpriv_find_start_code(buf + buf_index, buf + next_avc + 1, &state) - buf - 1;
77 
78  return FFMIN(buf_index, buf_size);
79 }
80 
81 static int h264_find_frame_end(H264ParseContext *p, const uint8_t *buf,
82  int buf_size, void *logctx)
83 {
84  int i, j;
85  uint32_t state;
86  ParseContext *pc = &p->pc;
87 
88  int next_avc = p->is_avc ? 0 : buf_size;
89 // mb_addr= pc->mb_addr - 1;
90  state = pc->state;
91  if (state > 13)
92  state = 7;
93 
94  if (p->is_avc && !p->nal_length_size)
95  av_log(logctx, AV_LOG_ERROR, "AVC-parser: nal length size invalid\n");
96 
97  for (i = 0; i < buf_size; i++) {
98  if (i >= next_avc) {
99  int64_t nalsize = 0;
100  i = next_avc;
101  for (j = 0; j < p->nal_length_size; j++)
102  nalsize = (nalsize << 8) | buf[i++];
103  if (!nalsize || nalsize > buf_size - i) {
104  av_log(logctx, AV_LOG_ERROR, "AVC-parser: nal size %"PRId64" "
105  "remaining %d\n", nalsize, buf_size - i);
106  return buf_size;
107  }
108  next_avc = i + nalsize;
109  state = 5;
110  }
111 
112  if (state == 7) {
113  i += p->h264dsp.startcode_find_candidate(buf + i, next_avc - i);
114  if (i < next_avc)
115  state = 2;
116  } else if (state <= 2) {
117  if (buf[i] == 1)
118  state ^= 5; // 2->7, 1->4, 0->5
119  else if (buf[i])
120  state = 7;
121  else
122  state >>= 1; // 2->1, 1->0, 0->0
123  } else if (state <= 5) {
124  int nalu_type = buf[i] & 0x1F;
125  if (nalu_type == H264_NAL_SEI || nalu_type == H264_NAL_SPS ||
126  nalu_type == H264_NAL_PPS || nalu_type == H264_NAL_AUD) {
127  if (pc->frame_start_found) {
128  i++;
129  goto found;
130  }
131  } else if (nalu_type == H264_NAL_SLICE || nalu_type == H264_NAL_DPA ||
132  nalu_type == H264_NAL_IDR_SLICE) {
133  state += 8;
134  continue;
135  }
136  state = 7;
137  } else {
138  unsigned int mb, last_mb = p->parse_last_mb;
139  GetBitContext gb;
140  p->parse_history[p->parse_history_count++] = buf[i];
141 
142  init_get_bits(&gb, p->parse_history, 8*p->parse_history_count);
143  mb= get_ue_golomb_long(&gb);
144  if (get_bits_left(&gb) > 0 || p->parse_history_count > 5) {
145  p->parse_last_mb = mb;
146  if (pc->frame_start_found) {
147  if (mb <= last_mb) {
148  i -= p->parse_history_count - 1;
149  p->parse_history_count = 0;
150  goto found;
151  }
152  } else
153  pc->frame_start_found = 1;
154  p->parse_history_count = 0;
155  state = 7;
156  }
157  }
158  }
159  pc->state = state;
160  if (p->is_avc)
161  return next_avc;
162  return END_NOT_FOUND;
163 
164 found:
165  pc->state = 7;
166  pc->frame_start_found = 0;
167  if (p->is_avc)
168  return next_avc;
169  return i - (state & 5);
170 }
171 
173  void *logctx)
174 {
176  int slice_type_nos = s->pict_type & 3;
177  H264ParseContext *p = s->priv_data;
178  int list_count, ref_count[2];
179 
180 
181  if (p->ps.pps->redundant_pic_cnt_present)
182  get_ue_golomb(gb); // redundant_pic_count
183 
184  if (slice_type_nos == AV_PICTURE_TYPE_B)
185  get_bits1(gb); // direct_spatial_mv_pred
186 
187  if (ff_h264_parse_ref_count(&list_count, ref_count, gb, p->ps.pps,
188  slice_type_nos, p->picture_structure, logctx) < 0)
189  return AVERROR_INVALIDDATA;
190 
191  if (slice_type_nos != AV_PICTURE_TYPE_I) {
192  int list;
193  for (list = 0; list < list_count; list++) {
194  if (get_bits1(gb)) {
195  int index;
196  for (index = 0; ; index++) {
197  unsigned int reordering_of_pic_nums_idc = get_ue_golomb_31(gb);
198 
199  if (reordering_of_pic_nums_idc < 3)
200  get_ue_golomb_long(gb);
201  else if (reordering_of_pic_nums_idc > 3) {
202  av_log(logctx, AV_LOG_ERROR,
203  "illegal reordering_of_pic_nums_idc %d\n",
204  reordering_of_pic_nums_idc);
205  return AVERROR_INVALIDDATA;
206  } else
207  break;
208 
209  if (index >= ref_count[list]) {
210  av_log(logctx, AV_LOG_ERROR,
211  "reference count %d overflow\n", index);
212  return AVERROR_INVALIDDATA;
213  }
214  }
215  }
216  }
217  }
218 
219  if ((p->ps.pps->weighted_pred && slice_type_nos == AV_PICTURE_TYPE_P) ||
220  (p->ps.pps->weighted_bipred_idc == 1 && slice_type_nos == AV_PICTURE_TYPE_B))
221  ff_h264_pred_weight_table(gb, p->ps.sps, ref_count, slice_type_nos,
222  &pwt, p->picture_structure, logctx);
223 
224  if (get_bits1(gb)) { // adaptive_ref_pic_marking_mode_flag
225  int i;
226  for (i = 0; i < H264_MAX_MMCO_COUNT; i++) {
227  MMCOOpcode opcode = get_ue_golomb_31(gb);
228  if (opcode > (unsigned) MMCO_LONG) {
229  av_log(logctx, AV_LOG_ERROR,
230  "illegal memory management control operation %d\n",
231  opcode);
232  return AVERROR_INVALIDDATA;
233  }
234  if (opcode == MMCO_END)
235  return 0;
236  else if (opcode == MMCO_RESET)
237  return 1;
238 
239  if (opcode == MMCO_SHORT2UNUSED || opcode == MMCO_SHORT2LONG)
240  get_ue_golomb_long(gb); // difference_of_pic_nums_minus1
241  if (opcode == MMCO_SHORT2LONG || opcode == MMCO_LONG2UNUSED ||
242  opcode == MMCO_LONG || opcode == MMCO_SET_MAX_LONG)
243  get_ue_golomb_31(gb);
244  }
245  }
246 
247  return 0;
248 }
249 
250 /**
251  * Parse NAL units of found picture and decode some basic information.
252  *
253  * @param s parser context.
254  * @param avctx codec context.
255  * @param buf buffer with field/frame data.
256  * @param buf_size size of the buffer.
257  */
259  AVCodecContext *avctx,
260  const uint8_t * const buf, int buf_size)
261 {
262  H264ParseContext *p = s->priv_data;
263  H2645RBSP rbsp = { NULL };
264  H2645NAL nal = { NULL };
265  int buf_index, next_avc;
266  unsigned int pps_id;
267  unsigned int slice_type;
268  int state = -1, got_reset = 0;
269  int q264 = buf_size >=4 && !memcmp("Q264", buf, 4);
270  int field_poc[2];
271  int ret;
272 
273  /* set some sane default values */
274  s->pict_type = AV_PICTURE_TYPE_I;
275  s->key_frame = 0;
276  s->picture_structure = AV_PICTURE_STRUCTURE_UNKNOWN;
277 
278  ff_h264_sei_uninit(&p->sei);
279  p->sei.common.frame_packing.arrangement_cancel_flag = -1;
280  p->sei.common.unregistered.x264_build = -1;
281 
282  if (!buf_size)
283  return 0;
284 
286  if (!rbsp.rbsp_buffer)
287  return AVERROR(ENOMEM);
288 
289  buf_index = 0;
290  next_avc = p->is_avc ? 0 : buf_size;
291  for (;;) {
292  const SPS *sps;
293  int src_length, consumed, nalsize = 0;
294 
295  if (buf_index >= next_avc) {
296  nalsize = get_nalsize(p->nal_length_size, buf, buf_size, &buf_index, avctx);
297  if (nalsize < 0)
298  break;
299  next_avc = buf_index + nalsize;
300  } else {
301  buf_index = find_start_code(buf, buf_size, buf_index, next_avc);
302  if (buf_index >= buf_size)
303  break;
304  if (buf_index >= next_avc)
305  continue;
306  }
307  src_length = next_avc - buf_index;
308 
309  state = buf[buf_index];
310  switch (state & 0x1f) {
311  case H264_NAL_SLICE:
312  case H264_NAL_IDR_SLICE:
313  // Do not walk the whole buffer just to decode slice header
314  if ((state & 0x1f) == H264_NAL_IDR_SLICE || ((state >> 5) & 0x3) == 0) {
315  /* IDR or disposable slice
316  * No need to decode many bytes because MMCOs shall not be present. */
317  if (src_length > 60)
318  src_length = 60;
319  } else {
320  /* To decode up to MMCOs */
321  if (src_length > 1000)
322  src_length = 1000;
323  }
324  break;
325  }
326  consumed = ff_h2645_extract_rbsp(buf + buf_index, src_length, &rbsp, &nal, 1);
327  if (consumed < 0)
328  break;
329 
330  buf_index += consumed;
331 
332  ret = init_get_bits8(&nal.gb, nal.data, nal.size);
333  if (ret < 0)
334  goto fail;
335  get_bits1(&nal.gb);
336  nal.ref_idc = get_bits(&nal.gb, 2);
337  nal.type = get_bits(&nal.gb, 5);
338 
339  switch (nal.type) {
340  case H264_NAL_SPS:
341  ff_h264_decode_seq_parameter_set(&nal.gb, avctx, &p->ps, 0);
342  break;
343  case H264_NAL_PPS:
344  ff_h264_decode_picture_parameter_set(&nal.gb, avctx, &p->ps,
345  nal.size_bits);
346  break;
347  case H264_NAL_SEI:
348  ff_h264_sei_decode(&p->sei, &nal.gb, &p->ps, avctx);
349  break;
350  case H264_NAL_IDR_SLICE:
351  s->key_frame = 1;
352 
353  p->poc.prev_frame_num = 0;
354  p->poc.prev_frame_num_offset = 0;
355  p->poc.prev_poc_msb =
356  p->poc.prev_poc_lsb = 0;
357  /* fall through */
358  case H264_NAL_SLICE:
359  get_ue_golomb_long(&nal.gb); // skip first_mb_in_slice
360  slice_type = get_ue_golomb_31(&nal.gb);
361  s->pict_type = ff_h264_golomb_to_pict_type[slice_type % 5];
362  if (p->sei.recovery_point.recovery_frame_cnt >= 0) {
363  /* key frame, since recovery_frame_cnt is set */
364  s->key_frame = 1;
365  }
366  pps_id = get_ue_golomb(&nal.gb);
367  if (pps_id >= MAX_PPS_COUNT) {
368  av_log(avctx, AV_LOG_ERROR,
369  "pps_id %u out of range\n", pps_id);
370  goto fail;
371  }
372  if (!p->ps.pps_list[pps_id]) {
373  av_log(avctx, AV_LOG_ERROR,
374  "non-existing PPS %u referenced\n", pps_id);
375  goto fail;
376  }
377 
378  av_refstruct_replace(&p->ps.pps, p->ps.pps_list[pps_id]);
379  p->ps.sps = p->ps.pps->sps;
380  sps = p->ps.sps;
381 
382  // heuristic to detect non marked keyframes
383  if (p->ps.sps->ref_frame_count <= 1 && p->ps.pps->ref_count[0] <= 1 && s->pict_type == AV_PICTURE_TYPE_I)
384  s->key_frame = 1;
385 
386  p->poc.frame_num = get_bits(&nal.gb, sps->log2_max_frame_num);
387 
388  s->coded_width = 16 * sps->mb_width;
389  s->coded_height = 16 * sps->mb_height;
390  s->width = s->coded_width - (sps->crop_right + sps->crop_left);
391  s->height = s->coded_height - (sps->crop_top + sps->crop_bottom);
392  if (s->width <= 0 || s->height <= 0) {
393  s->width = s->coded_width;
394  s->height = s->coded_height;
395  }
396 
397  switch (sps->bit_depth_luma) {
398  case 9:
399  if (sps->chroma_format_idc == 3) s->format = AV_PIX_FMT_YUV444P9;
400  else if (sps->chroma_format_idc == 2) s->format = AV_PIX_FMT_YUV422P9;
401  else s->format = AV_PIX_FMT_YUV420P9;
402  break;
403  case 10:
404  if (sps->chroma_format_idc == 3) s->format = AV_PIX_FMT_YUV444P10;
405  else if (sps->chroma_format_idc == 2) s->format = AV_PIX_FMT_YUV422P10;
406  else s->format = AV_PIX_FMT_YUV420P10;
407  break;
408  case 8:
409  if (sps->chroma_format_idc == 3) s->format = AV_PIX_FMT_YUV444P;
410  else if (sps->chroma_format_idc == 2) s->format = AV_PIX_FMT_YUV422P;
411  else s->format = AV_PIX_FMT_YUV420P;
412  break;
413  default:
414  s->format = AV_PIX_FMT_NONE;
415  }
416 
417  avctx->profile = ff_h264_get_profile(sps);
418  avctx->level = sps->level_idc;
419 
420  if (sps->frame_mbs_only_flag) {
421  p->picture_structure = PICT_FRAME;
422  } else {
423  if (get_bits1(&nal.gb)) { // field_pic_flag
424  p->picture_structure = PICT_TOP_FIELD + get_bits1(&nal.gb); // bottom_field_flag
425  } else {
426  p->picture_structure = PICT_FRAME;
427  }
428  }
429 
430  if (nal.type == H264_NAL_IDR_SLICE)
431  get_ue_golomb_long(&nal.gb); /* idr_pic_id */
432  if (sps->poc_type == 0) {
433  p->poc.poc_lsb = get_bits(&nal.gb, sps->log2_max_poc_lsb);
434 
435  if (p->ps.pps->pic_order_present == 1 &&
436  p->picture_structure == PICT_FRAME)
437  p->poc.delta_poc_bottom = get_se_golomb(&nal.gb);
438  }
439 
440  if (sps->poc_type == 1 &&
441  !sps->delta_pic_order_always_zero_flag) {
442  p->poc.delta_poc[0] = get_se_golomb(&nal.gb);
443 
444  if (p->ps.pps->pic_order_present == 1 &&
445  p->picture_structure == PICT_FRAME)
446  p->poc.delta_poc[1] = get_se_golomb(&nal.gb);
447  }
448 
449  /* Decode POC of this picture.
450  * The prev_ values needed for decoding POC of the next picture are not set here. */
451  field_poc[0] = field_poc[1] = INT_MAX;
452  ret = ff_h264_init_poc(field_poc, &s->output_picture_number, sps,
453  &p->poc, p->picture_structure, nal.ref_idc);
454  if (ret < 0)
455  goto fail;
456 
457  /* Continue parsing to check if MMCO_RESET is present.
458  * FIXME: MMCO_RESET could appear in non-first slice.
459  * Maybe, we should parse all undisposable non-IDR slice of this
460  * picture until encountering MMCO_RESET in a slice of it. */
461  if (nal.ref_idc && nal.type != H264_NAL_IDR_SLICE) {
462  got_reset = scan_mmco_reset(s, &nal.gb, avctx);
463  if (got_reset < 0)
464  goto fail;
465  }
466 
467  /* Set up the prev_ values for decoding POC of the next picture. */
468  p->poc.prev_frame_num = got_reset ? 0 : p->poc.frame_num;
469  p->poc.prev_frame_num_offset = got_reset ? 0 : p->poc.frame_num_offset;
470  if (nal.ref_idc != 0) {
471  if (!got_reset) {
472  p->poc.prev_poc_msb = p->poc.poc_msb;
473  p->poc.prev_poc_lsb = p->poc.poc_lsb;
474  } else {
475  p->poc.prev_poc_msb = 0;
476  p->poc.prev_poc_lsb =
477  p->picture_structure == PICT_BOTTOM_FIELD ? 0 : field_poc[0];
478  }
479  }
480 
481  if (p->sei.picture_timing.present) {
482  ret = ff_h264_sei_process_picture_timing(&p->sei.picture_timing,
483  sps, avctx);
484  if (ret < 0) {
485  av_log(avctx, AV_LOG_ERROR, "Error processing the picture timing SEI\n");
486  p->sei.picture_timing.present = 0;
487  }
488  }
489 
490  if (sps->pic_struct_present_flag && p->sei.picture_timing.present) {
491  switch (p->sei.picture_timing.pic_struct) {
494  s->repeat_pict = 0;
495  break;
499  s->repeat_pict = 1;
500  break;
503  s->repeat_pict = 2;
504  break;
506  s->repeat_pict = 3;
507  break;
509  s->repeat_pict = 5;
510  break;
511  default:
512  s->repeat_pict = p->picture_structure == PICT_FRAME ? 1 : 0;
513  break;
514  }
515  } else {
516  s->repeat_pict = p->picture_structure == PICT_FRAME ? 1 : 0;
517  }
518 
519  if (p->picture_structure == PICT_FRAME) {
520  s->picture_structure = AV_PICTURE_STRUCTURE_FRAME;
521  if (sps->pic_struct_present_flag && p->sei.picture_timing.present) {
522  switch (p->sei.picture_timing.pic_struct) {
525  s->field_order = AV_FIELD_TT;
526  break;
529  s->field_order = AV_FIELD_BB;
530  break;
531  default:
532  s->field_order = AV_FIELD_PROGRESSIVE;
533  break;
534  }
535  } else {
536  if (field_poc[0] < field_poc[1])
537  s->field_order = AV_FIELD_TT;
538  else if (field_poc[0] > field_poc[1])
539  s->field_order = AV_FIELD_BB;
540  else
541  s->field_order = AV_FIELD_PROGRESSIVE;
542  }
543  } else {
544  if (p->picture_structure == PICT_TOP_FIELD)
545  s->picture_structure = AV_PICTURE_STRUCTURE_TOP_FIELD;
546  else
547  s->picture_structure = AV_PICTURE_STRUCTURE_BOTTOM_FIELD;
548  if (p->poc.frame_num == p->last_frame_num &&
549  p->last_picture_structure != AV_PICTURE_STRUCTURE_UNKNOWN &&
550  p->last_picture_structure != AV_PICTURE_STRUCTURE_FRAME &&
551  p->last_picture_structure != s->picture_structure) {
552  if (p->last_picture_structure == AV_PICTURE_STRUCTURE_TOP_FIELD)
553  s->field_order = AV_FIELD_TT;
554  else
555  s->field_order = AV_FIELD_BB;
556  } else {
557  s->field_order = AV_FIELD_UNKNOWN;
558  }
559  p->last_picture_structure = s->picture_structure;
560  p->last_frame_num = p->poc.frame_num;
561  }
562  if (sps->timing_info_present_flag) {
563  int64_t den = sps->time_scale;
564  if (p->sei.common.unregistered.x264_build < 44U)
565  den *= 2;
566  av_reduce(&avctx->framerate.den, &avctx->framerate.num,
567  sps->num_units_in_tick * 2, den, 1 << 30);
568  }
569 
570  av_freep(&rbsp.rbsp_buffer);
571  return 0; /* no need to evaluate the rest */
572  }
573  }
574  if (q264) {
575  av_freep(&rbsp.rbsp_buffer);
576  return 0;
577  }
578  /* didn't find a picture! */
579  av_log(avctx, AV_LOG_ERROR, "missing picture in access unit with size %d\n", buf_size);
580 fail:
581  av_freep(&rbsp.rbsp_buffer);
582  return -1;
583 }
584 
586  AVCodecContext *avctx,
587  const uint8_t **poutbuf, int *poutbuf_size,
588  const uint8_t *buf, int buf_size)
589 {
590  H264ParseContext *p = s->priv_data;
591  ParseContext *pc = &p->pc;
592  AVRational time_base = { 0, 1 };
593  int next;
594 
595  if (!p->got_first) {
596  p->got_first = 1;
597  if (avctx->extradata_size) {
599  &p->ps, &p->is_avc, &p->nal_length_size,
600  avctx->err_recognition, avctx);
601  }
602  }
603 
604  if (s->flags & PARSER_FLAG_COMPLETE_FRAMES) {
605  next = buf_size;
606  } else {
607  next = h264_find_frame_end(p, buf, buf_size, avctx);
608 
609  if (ff_combine_frame(pc, next, &buf, &buf_size) < 0) {
610  *poutbuf = NULL;
611  *poutbuf_size = 0;
612  return buf_size;
613  }
614 
615  if (next < 0 && next != END_NOT_FOUND) {
616  av_assert1(pc->last_index + next >= 0);
617  h264_find_frame_end(p, &pc->buffer[pc->last_index + next], -next, avctx); // update state
618  }
619  }
620 
621  parse_nal_units(s, avctx, buf, buf_size);
622 
623  if (avctx->framerate.num)
624  time_base = av_inv_q(av_mul_q(avctx->framerate, (AVRational){2, 1}));
625  if (p->sei.picture_timing.cpb_removal_delay >= 0) {
626  s->dts_sync_point = p->sei.buffering_period.present;
627  s->dts_ref_dts_delta = p->sei.picture_timing.cpb_removal_delay;
628  s->pts_dts_delta = p->sei.picture_timing.dpb_output_delay;
629  } else {
630  s->dts_sync_point = INT_MIN;
631  s->dts_ref_dts_delta = INT_MIN;
632  s->pts_dts_delta = INT_MIN;
633  }
634 
635  if (s->flags & PARSER_FLAG_ONCE) {
636  s->flags &= PARSER_FLAG_COMPLETE_FRAMES;
637  }
638 
639  if (s->dts_sync_point >= 0) {
640  int64_t den = time_base.den * (int64_t)avctx->pkt_timebase.num;
641  if (den > 0) {
642  int64_t num = time_base.num * (int64_t)avctx->pkt_timebase.den;
643  if (s->dts != AV_NOPTS_VALUE) {
644  // got DTS from the stream, update reference timestamp
645  p->reference_dts = av_sat_sub64(s->dts, av_rescale(s->dts_ref_dts_delta, num, den));
646  } else if (p->reference_dts != AV_NOPTS_VALUE) {
647  // compute DTS based on reference timestamp
648  s->dts = av_sat_add64(p->reference_dts, av_rescale(s->dts_ref_dts_delta, num, den));
649  }
650 
651  if (p->reference_dts != AV_NOPTS_VALUE && s->pts == AV_NOPTS_VALUE)
652  s->pts = s->dts + av_rescale(s->pts_dts_delta, num, den);
653 
654  if (s->dts_sync_point > 0)
655  p->reference_dts = s->dts; // new reference
656  }
657  }
658 
659  *poutbuf = buf;
660  *poutbuf_size = buf_size;
661  return next;
662 }
663 
665 {
666  H264ParseContext *p = s->priv_data;
667  ParseContext *pc = &p->pc;
668 
669  av_freep(&pc->buffer);
670 
671  ff_h264_sei_uninit(&p->sei);
672  ff_h264_ps_uninit(&p->ps);
673 }
674 
676 {
677  H264ParseContext *p = s->priv_data;
678 
679  p->reference_dts = AV_NOPTS_VALUE;
680  p->last_frame_num = INT_MAX;
681  ff_h264dsp_init(&p->h264dsp, 8, 1);
682  return 0;
683 }
684 
687  .priv_data_size = sizeof(H264ParseContext),
688  .parser_init = init,
689  .parser_parse = h264_parse,
690  .parser_close = h264_close,
691 };
MMCO_LONG2UNUSED
@ MMCO_LONG2UNUSED
Definition: h264_parse.h:62
PICT_FRAME
#define PICT_FRAME
Definition: mpegutils.h:33
H264ParseContext
Definition: h264_parser.c:54
MMCO_LONG
@ MMCO_LONG
Definition: h264_parse.h:66
ff_h264_sei_uninit
void ff_h264_sei_uninit(H264SEIContext *h)
Reset SEI values at the beginning of the frame.
Definition: h264_sei.c:48
h2645_parse.h
get_bits_left
static int get_bits_left(GetBitContext *gb)
Definition: get_bits.h:689
AVERROR
Filter the word β€œframe” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
H264ParseContext::sei
H264SEIContext sei
Definition: h264_parser.c:59
ff_h264_ps_uninit
void ff_h264_ps_uninit(H264ParamSets *ps)
Uninit H264 param sets structure.
Definition: h264_ps.c:270
h264_close
static av_cold void h264_close(AVCodecParserContext *s)
Definition: h264_parser.c:664
H264ParseContext::parse_last_mb
int parse_last_mb
Definition: h264_parser.c:66
AV_FIELD_PROGRESSIVE
@ AV_FIELD_PROGRESSIVE
Definition: defs.h:213
AV_PICTURE_STRUCTURE_UNKNOWN
@ AV_PICTURE_STRUCTURE_UNKNOWN
unknown
Definition: avcodec.h:2569
AVCodecContext::err_recognition
int err_recognition
Error recognition; may misdetect some more or less valid parts as errors.
Definition: avcodec.h:1398
int64_t
long long int64_t
Definition: coverity.c:34
H264ParseContext::is_avc
int is_avc
Definition: h264_parser.c:60
H264_SEI_PIC_STRUCT_TOP_BOTTOM
@ H264_SEI_PIC_STRUCT_TOP_BOTTOM
3: top field, bottom field, in that order
Definition: h264_sei.h:35
H2645NAL::ref_idc
int ref_idc
H.264 only, nal_ref_idc.
Definition: h2645_parse.h:57
scan_mmco_reset
static int scan_mmco_reset(AVCodecParserContext *s, GetBitContext *gb, void *logctx)
Definition: h264_parser.c:172
h264_parse.h
get_ue_golomb
static int get_ue_golomb(GetBitContext *gb)
Read an unsigned Exp-Golomb code in the range 0 to 8190.
Definition: golomb.h:53
state
static struct @527 state
H264ParseContext::parse_history
uint8_t parse_history[6]
Definition: h264_parser.c:64
AV_PIX_FMT_YUV420P10
#define AV_PIX_FMT_YUV420P10
Definition: pixfmt.h:539
PICT_BOTTOM_FIELD
#define PICT_BOTTOM_FIELD
Definition: mpegutils.h:32
ff_h264_pred_weight_table
int ff_h264_pred_weight_table(GetBitContext *gb, const SPS *sps, const int *ref_count, int slice_type_nos, H264PredWeightTable *pwt, int picture_structure, void *logctx)
Definition: h264_parse.c:30
H264ParseContext::picture_structure
int picture_structure
Definition: h264_parser.c:63
mpegutils.h
MMCOOpcode
MMCOOpcode
Memory management control operation opcode.
Definition: h264_parse.h:59
ParseContext::state
uint32_t state
contains the last few bytes in MSB order
Definition: parser.h:33
init_get_bits
static int init_get_bits(GetBitContext *s, const uint8_t *buffer, int bit_size)
Initialize GetBitContext.
Definition: get_bits.h:512
ParseContext::last_index
int last_index
Definition: parser.h:31
H264ParseContext::got_first
int got_first
Definition: h264_parser.c:62
H2645NAL::size_bits
int size_bits
Size, in bits, of just the data, excluding the stop bit and any trailing padding.
Definition: h2645_parse.h:42
ff_h264_decode_picture_parameter_set
int ff_h264_decode_picture_parameter_set(GetBitContext *gb, AVCodecContext *avctx, H264ParamSets *ps, int bit_length)
Decode PPS.
Definition: h264_ps.c:696
MMCO_SET_MAX_LONG
@ MMCO_SET_MAX_LONG
Definition: h264_parse.h:64
AVCodecContext::framerate
AVRational framerate
Definition: avcodec.h:551
golomb.h
exp golomb vlc stuff
get_bits
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:333
AV_FIELD_TT
@ AV_FIELD_TT
Top coded_first, top displayed first.
Definition: defs.h:214
ParseContext
Definition: parser.h:28
H264ParseContext::h264dsp
H264DSPContext h264dsp
Definition: h264_parser.c:57
fail
#define fail()
Definition: checkasm.h:203
H264_MAX_MMCO_COUNT
@ H264_MAX_MMCO_COUNT
Definition: h264.h:92
ff_h264_sei_decode
int ff_h264_sei_decode(H264SEIContext *h, GetBitContext *gb, const H264ParamSets *ps, void *logctx)
Definition: h264_sei.c:230
H264_NAL_SLICE
@ H264_NAL_SLICE
Definition: h264.h:35
GetBitContext
Definition: get_bits.h:109
AV_PIX_FMT_YUV422P9
#define AV_PIX_FMT_YUV422P9
Definition: pixfmt.h:537
ff_h264_sei_process_picture_timing
int ff_h264_sei_process_picture_timing(H264SEIPictureTiming *h, const SPS *sps, void *logctx)
Parse the contents of a picture timing message given an active SPS.
Definition: h264_sei.c:64
ff_h264_golomb_to_pict_type
const uint8_t ff_h264_golomb_to_pict_type[5]
Definition: h264data.c:37
av_reduce
int av_reduce(int *dst_num, int *dst_den, int64_t num, int64_t den, int64_t max)
Reduce a fraction.
Definition: rational.c:35
AVRational::num
int num
Numerator.
Definition: rational.h:59
parse_nal_units
static int parse_nal_units(AVCodecParserContext *s, AVCodecContext *avctx, const uint8_t *const buf, int buf_size)
Parse NAL units of found picture and decode some basic information.
Definition: h264_parser.c:258
refstruct.h
h264_parse
static int h264_parse(AVCodecParserContext *s, AVCodecContext *avctx, const uint8_t **poutbuf, int *poutbuf_size, const uint8_t *buf, int buf_size)
Definition: h264_parser.c:585
AV_PIX_FMT_YUV444P10
#define AV_PIX_FMT_YUV444P10
Definition: pixfmt.h:542
ParseContext::buffer
uint8_t * buffer
Definition: parser.h:29
AV_PICTURE_STRUCTURE_FRAME
@ AV_PICTURE_STRUCTURE_FRAME
coded as frame
Definition: avcodec.h:2572
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:210
av_cold
#define av_cold
Definition: attributes.h:100
init_get_bits8
static int init_get_bits8(GetBitContext *s, const uint8_t *buffer, int byte_size)
Initialize GetBitContext.
Definition: get_bits.h:539
AV_FIELD_UNKNOWN
@ AV_FIELD_UNKNOWN
Definition: defs.h:212
H2645NAL::size
int size
Definition: h2645_parse.h:36
AVCodecContext::extradata_size
int extradata_size
Definition: avcodec.h:515
s
#define s(width, name)
Definition: cbs_vp9.c:198
ff_h264_decode_extradata
int ff_h264_decode_extradata(const uint8_t *data, int size, H264ParamSets *ps, int *is_avc, int *nal_length_size, int err_recognition, void *logctx)
Definition: h264_parse.c:466
h264data.h
AV_PIX_FMT_YUV420P9
#define AV_PIX_FMT_YUV420P9
Definition: pixfmt.h:536
PICT_TOP_FIELD
#define PICT_TOP_FIELD
Definition: mpegutils.h:31
get_bits.h
H2645NAL::data
const uint8_t * data
Definition: h2645_parse.h:35
AV_PIX_FMT_YUV420P
@ AV_PIX_FMT_YUV420P
planar YUV 4:2:0, 12bpp, (1 Cr & Cb sample per 2x2 Y samples)
Definition: pixfmt.h:73
get_se_golomb
static int get_se_golomb(GetBitContext *gb)
read signed exp golomb code.
Definition: golomb.h:239
AV_CODEC_ID_H264
@ AV_CODEC_ID_H264
Definition: codec_id.h:79
H2645NAL::type
int type
NAL unit type.
Definition: h2645_parse.h:52
H264_NAL_SPS
@ H264_NAL_SPS
Definition: h264.h:41
if
if(ret)
Definition: filter_design.txt:179
AV_PICTURE_STRUCTURE_BOTTOM_FIELD
@ AV_PICTURE_STRUCTURE_BOTTOM_FIELD
coded as bottom field
Definition: avcodec.h:2571
NULL
#define NULL
Definition: coverity.c:32
H264SEIContext
Definition: h264_sei.h:119
AVRational
Rational number (pair of numerator and denominator).
Definition: rational.h:58
SPS
Sequence parameter set.
Definition: h264_ps.h:44
AV_PICTURE_STRUCTURE_TOP_FIELD
@ AV_PICTURE_STRUCTURE_TOP_FIELD
coded as top field
Definition: avcodec.h:2570
H264_NAL_AUD
@ H264_NAL_AUD
Definition: h264.h:43
AV_PICTURE_TYPE_I
@ AV_PICTURE_TYPE_I
Intra.
Definition: avutil.h:278
get_bits1
static unsigned int get_bits1(GetBitContext *s)
Definition: get_bits.h:386
h264dsp.h
ParseContext::frame_start_found
int frame_start_found
Definition: parser.h:34
list
Filter the word β€œframe” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining list
Definition: filter_design.txt:25
avpriv_find_start_code
const uint8_t * avpriv_find_start_code(const uint8_t *p, const uint8_t *end, uint32_t *state)
MAX_PPS_COUNT
#define MAX_PPS_COUNT
Definition: h264_ps.h:38
AV_PIX_FMT_YUV422P10
#define AV_PIX_FMT_YUV422P10
Definition: pixfmt.h:540
AVCodecContext::level
int level
Encoding level descriptor.
Definition: avcodec.h:1628
h264_find_frame_end
static int h264_find_frame_end(H264ParseContext *p, const uint8_t *buf, int buf_size, void *logctx)
Definition: h264_parser.c:81
h264_ps.h
index
int index
Definition: gxfenc.c:90
error.h
H264_SEI_PIC_STRUCT_BOTTOM_TOP_BOTTOM
@ H264_SEI_PIC_STRUCT_BOTTOM_TOP_BOTTOM
6: bottom field, top field, bottom field repeated, in that order
Definition: h264_sei.h:38
H2645RBSP::rbsp_buffer
uint8_t * rbsp_buffer
Definition: h2645_parse.h:75
startcode.h
H264DSPContext
Context for storing H.264 DSP functions.
Definition: h264dsp.h:42
av_sat_sub64
#define av_sat_sub64
Definition: common.h:142
MMCO_END
@ MMCO_END
Definition: h264_parse.h:60
AVCodecParser::codec_ids
int codec_ids[7]
Definition: avcodec.h:2735
H264_NAL_PPS
@ H264_NAL_PPS
Definition: h264.h:42
AVCodecContext::pkt_timebase
AVRational pkt_timebase
Timebase in which pkt_dts/pts and AVPacket.dts/pts are expressed.
Definition: avcodec.h:542
AV_NOPTS_VALUE
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:247
H264_SEI_PIC_STRUCT_BOTTOM_TOP
@ H264_SEI_PIC_STRUCT_BOTTOM_TOP
4: bottom field, top field, in that order
Definition: h264_sei.h:36
H2645NAL::gb
GetBitContext gb
Definition: h2645_parse.h:47
MMCO_SHORT2UNUSED
@ MMCO_SHORT2UNUSED
Definition: h264_parse.h:61
H2645NAL
Definition: h2645_parse.h:34
MMCO_RESET
@ MMCO_RESET
Definition: h264_parse.h:65
H264ParseContext::parse_history_count
int parse_history_count
Definition: h264_parser.c:65
ff_h264_parser
const AVCodecParser ff_h264_parser
Definition: h264_parser.c:685
H264ParseContext::last_frame_num
int last_frame_num
Definition: h264_parser.c:68
attributes.h
mb
#define mb
Definition: vf_colormatrix.c:99
ff_combine_frame
int ff_combine_frame(ParseContext *pc, int next, const uint8_t **buf, int *buf_size)
Combine the (truncated) bitstream to a complete frame.
Definition: parser.c:204
H264_SEI_PIC_STRUCT_FRAME
@ H264_SEI_PIC_STRUCT_FRAME
0: frame
Definition: h264_sei.h:32
H264_SEI_PIC_STRUCT_FRAME_TRIPLING
@ H264_SEI_PIC_STRUCT_FRAME_TRIPLING
8: frame tripling
Definition: h264_sei.h:40
h264_sei.h
ff_h264_decode_seq_parameter_set
int ff_h264_decode_seq_parameter_set(GetBitContext *gb, AVCodecContext *avctx, H264ParamSets *ps, int ignore_truncation)
Decode SPS.
Definition: h264_ps.c:284
log.h
PARSER_FLAG_COMPLETE_FRAMES
#define PARSER_FLAG_COMPLETE_FRAMES
Definition: avcodec.h:2609
MMCO_SHORT2LONG
@ MMCO_SHORT2LONG
Definition: h264_parse.h:63
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:256
H264_SEI_PIC_STRUCT_FRAME_DOUBLING
@ H264_SEI_PIC_STRUCT_FRAME_DOUBLING
7: frame doubling
Definition: h264_sei.h:39
AVCodecContext::extradata
uint8_t * extradata
Out-of-band global headers that may be used by some codecs.
Definition: avcodec.h:514
ff_h2645_extract_rbsp
int ff_h2645_extract_rbsp(const uint8_t *src, int length, H2645RBSP *rbsp, H2645NAL *nal, int small_padding)
Extract the raw (unescaped) bitstream.
Definition: h2645_parse.c:37
H264POCContext
Definition: h264_parse.h:82
AV_FIELD_BB
@ AV_FIELD_BB
Bottom coded first, bottom displayed first.
Definition: defs.h:215
av_assert1
#define av_assert1(cond)
assert() equivalent, that does not lie in speed critical code.
Definition: avassert.h:57
av_fast_padded_malloc
void av_fast_padded_malloc(void *ptr, unsigned int *size, size_t min_size)
Same behaviour av_fast_malloc but the buffer has additional AV_INPUT_BUFFER_PADDING_SIZE at the end w...
Definition: utils.c:53
FFMIN
#define FFMIN(a, b)
Definition: macros.h:49
av_inv_q
static av_always_inline AVRational av_inv_q(AVRational q)
Invert a rational.
Definition: rational.h:159
parser.h
ff_h264_parse_ref_count
int ff_h264_parse_ref_count(int *plist_count, int ref_count[2], GetBitContext *gb, const PPS *pps, int slice_type_nos, int picture_structure, void *logctx)
Definition: h264_parse.c:222
av_rescale
int64_t av_rescale(int64_t a, int64_t b, int64_t c)
Rescale a 64-bit integer with rounding to nearest.
Definition: mathematics.c:129
H264ParseContext::last_picture_structure
int last_picture_structure
Definition: h264_parser.c:68
AV_PIX_FMT_YUV444P9
#define AV_PIX_FMT_YUV444P9
Definition: pixfmt.h:538
H2645RBSP::rbsp_buffer_alloc_size
int rbsp_buffer_alloc_size
Definition: h2645_parse.h:77
avcodec.h
AVCodecParserContext
Definition: avcodec.h:2575
ff_h264dsp_init
av_cold void ff_h264dsp_init(H264DSPContext *c, const int bit_depth, const int chroma_format_idc)
Definition: h264dsp.c:66
ret
ret
Definition: filter_design.txt:187
ff_h264_init_poc
int ff_h264_init_poc(int pic_field_poc[2], int *pic_poc, const SPS *sps, H264POCContext *pc, int picture_structure, int nal_ref_idc)
Definition: h264_parse.c:280
pixfmt.h
ff_h264_get_profile
int ff_h264_get_profile(const SPS *sps)
Compute profile from profile_idc and constraint_set?_flags.
Definition: h264_parse.c:533
H264_NAL_SEI
@ H264_NAL_SEI
Definition: h264.h:40
sps
static int FUNC() sps(CodedBitstreamContext *ctx, RWContext *rw, H264RawSPS *current)
Definition: cbs_h264_syntax_template.c:260
av_sat_add64
#define av_sat_add64
Definition: common.h:139
U
#define U(x)
Definition: vpx_arith.h:37
AVCodecContext
main external API structure.
Definition: avcodec.h:431
get_ue_golomb_31
static int get_ue_golomb_31(GetBitContext *gb)
read unsigned exp golomb code, constraint to a max of 31.
Definition: golomb.h:120
find_start_code
static int find_start_code(const uint8_t *buf, int buf_size, int buf_index, int next_avc)
Definition: h264_parser.c:71
AV_PICTURE_TYPE_B
@ AV_PICTURE_TYPE_B
Bi-dir predicted.
Definition: avutil.h:280
av_refstruct_replace
void av_refstruct_replace(void *dstp, const void *src)
Ensure *dstp refers to the same object as src.
Definition: refstruct.c:160
AVRational::den
int den
Denominator.
Definition: rational.h:60
AV_PIX_FMT_NONE
@ AV_PIX_FMT_NONE
Definition: pixfmt.h:72
H264ParseContext::nal_length_size
int nal_length_size
Definition: h264_parser.c:61
AVCodecContext::profile
int profile
profile
Definition: avcodec.h:1618
H264ParamSets
Definition: h264_ps.h:144
Windows::Graphics::DirectX::Direct3D11::p
IDirect3DDxgiInterfaceAccess _COM_Outptr_ void ** p
Definition: vsrc_gfxcapture_winrt.hpp:53
av_mul_q
AVRational av_mul_q(AVRational b, AVRational c)
Multiply two rationals.
Definition: rational.c:80
H264PredWeightTable
Definition: h264_parse.h:69
AV_PIX_FMT_YUV444P
@ AV_PIX_FMT_YUV444P
planar YUV 4:4:4, 24bpp, (1 Cr & Cb sample per 1x1 Y samples)
Definition: pixfmt.h:78
AV_PICTURE_TYPE_P
@ AV_PICTURE_TYPE_P
Predicted.
Definition: avutil.h:279
avutil.h
AV_PIX_FMT_YUV422P
@ AV_PIX_FMT_YUV422P
planar YUV 4:2:2, 16bpp, (1 Cr & Cb sample per 2x1 Y samples)
Definition: pixfmt.h:77
mem.h
init
static av_cold int init(AVCodecParserContext *s)
Definition: h264_parser.c:675
get_ue_golomb_long
static unsigned get_ue_golomb_long(GetBitContext *gb)
Read an unsigned Exp-Golomb code in the range 0 to UINT32_MAX-1.
Definition: golomb.h:104
H264_SEI_PIC_STRUCT_BOTTOM_FIELD
@ H264_SEI_PIC_STRUCT_BOTTOM_FIELD
2: bottom field
Definition: h264_sei.h:34
H264ParseContext::ps
H264ParamSets ps
Definition: h264_parser.c:56
H264ParseContext::poc
H264POCContext poc
Definition: h264_parser.c:58
END_NOT_FOUND
#define END_NOT_FOUND
Definition: parser.h:40
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35
H264_NAL_DPA
@ H264_NAL_DPA
Definition: h264.h:36
AVCodecParser
Definition: avcodec.h:2734
h264.h
get_nalsize
static int get_nalsize(int nal_length_size, const uint8_t *buf, int buf_size, int *buf_index, void *logctx)
Definition: h2645_parse.h:126
H264ParseContext::reference_dts
int64_t reference_dts
Definition: h264_parser.c:67
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:27
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
PARSER_FLAG_ONCE
#define PARSER_FLAG_ONCE
Definition: avcodec.h:2610
H2645RBSP
Definition: h2645_parse.h:74
H264_NAL_IDR_SLICE
@ H264_NAL_IDR_SLICE
Definition: h264.h:39
H264_SEI_PIC_STRUCT_TOP_FIELD
@ H264_SEI_PIC_STRUCT_TOP_FIELD
1: top field
Definition: h264_sei.h:33
H264_SEI_PIC_STRUCT_TOP_BOTTOM_TOP
@ H264_SEI_PIC_STRUCT_TOP_BOTTOM_TOP
5: top field, bottom field, top field repeated, in that order
Definition: h264_sei.h:37
H264ParseContext::pc
ParseContext pc
Definition: h264_parser.c:55