FFmpeg
h264_mp4toannexb_bsf.c
Go to the documentation of this file.
1 /*
2  * H.264 MP4 to Annex B byte stream format filter
3  * Copyright (c) 2007 Benoit Fouet <benoit.fouet@free.fr>
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include <string.h>
23 
24 #include "libavutil/avassert.h"
25 #include "libavutil/intreadwrite.h"
26 #include "libavutil/mem.h"
27 
28 #include "bsf.h"
29 #include "bsf_internal.h"
30 #include "bytestream.h"
31 #include "defs.h"
32 #include "h264.h"
33 
/*
 * Private state of the MP4-to-Annex-B filter.
 *
 * NOTE(review): this listing ends after idr_pps_seen; the closing brace is
 * not visible. The index at the end of the page additionally lists an
 * `int extradata_parsed` member (listing line 43), which the other
 * functions read and write.
 */
34 typedef struct H264BSFContext {
/* Start of the converted SPS data; set by h264_extradata_to_annexb(). */
35  uint8_t *sps;
/* Start of the converted PPS data inside the same buffer as sps. */
36  uint8_t *pps;
/* Sizes in bytes of the regions sps and pps point to. */
37  int sps_size;
38  int pps_size;
/* Number of bytes of the length prefix read in front of each NAL unit of
 * an input packet. */
39  uint8_t length_size;
/* Per-stream state carried from one filtered packet to the next: loaded
 * at the start of the filter callback and stored back at its end. */
40  uint8_t new_idr;
41  uint8_t idr_sps_seen;
42  uint8_t idr_pps_seen;
45 
/**
 * Account for one NAL unit in the output and, optionally, write it.
 *
 * The start code put in front of the payload is selected as follows:
 *   - ps < 0:                         no start code, payload only;
 *   - ps != 0 or *out_size == 0:      4 bytes, 00 00 00 01;
 *   - otherwise:                      3 bytes, 00 00 01.
 *
 * @param out       write cursor; only dereferenced and advanced when
 *                  copy is nonzero
 * @param out_size  running output size; always increased by the start
 *                  code length plus in_size
 * @param in        payload to append
 * @param in_size   payload size in bytes
 * @param ps        start code selector, see above
 * @param copy      0 to only count, nonzero to also write the bytes
 */
static void count_or_copy(uint8_t **out, uint64_t *out_size,
                          const uint8_t *in, int in_size, int ps, int copy)
{
    uint8_t prefix_len;

    if (ps < 0)
        prefix_len = 0;
    else if (ps || *out_size == 0)
        prefix_len = 4;
    else
        prefix_len = 3;

    if (copy) {
        uint8_t *dst = *out;

        /* A start code is a run of zero bytes terminated by one 0x01. */
        if (prefix_len) {
            memset(dst, 0, prefix_len - 1);
            dst[prefix_len - 1] = 1;
        }
        memcpy(dst + prefix_len, in, in_size);

        *out = dst + prefix_len + in_size;
    }

    *out_size += prefix_len + in_size;
}
64 
/*
 * Convert the input extradata (ctx->par_in->extradata) into a sequence of
 * parameter sets that are each prefixed with the 4-byte start code
 * 00 00 00 01, and install the result as ctx->par_out->extradata.
 *
 * The converted buffer is followed by `padding` zeroed bytes. s->sps and
 * s->pps are pointed into that same buffer, so they alias the output
 * extradata rather than owning separate memory.
 *
 * ctx      filter context; par_in->extradata is read, par_out->extradata
 *          is replaced
 * padding  number of zero bytes appended after the converted data
 *
 * Returns the NAL length prefix size in bytes (1 to 4) on success,
 * AVERROR_INVALIDDATA if the extradata is truncated, or the error returned
 * by av_reallocp().
 *
 * NOTE(review): listing line 67 is missing here; `s` is used below but its
 * declaration is not visible - presumably the filter's H264BSFContext,
 * confirm against the real file.
 */
65 static int h264_extradata_to_annexb(AVBSFContext *ctx, const int padding)
66 {
68  GetByteContext ogb, *gb = &ogb;
69  uint16_t unit_size;
70  uint32_t total_size = 0;
71  uint8_t *out = NULL, unit_nb, sps_done = 0;
72  static const uint8_t nalu_header[4] = { 0, 0, 0, 1 };
73  int length_size, pps_offset = 0;
74 
75  bytestream2_init(gb, ctx->par_in->extradata, ctx->par_in->extradata_size);
76 
/* The first four bytes of the extradata are not used by this function. */
77  bytestream2_skipu(gb, 4);
78 
79  /* retrieve length coded size */
80  length_size = (bytestream2_get_byteu(gb) & 0x3) + 1;
81 
82  /* retrieve sps and pps unit(s) */
83  unit_nb = bytestream2_get_byteu(gb) & 0x1f; /* number of sps unit(s) */
/* With no SPS units, jump straight into the loop body at the point where
 * the PPS count is read. */
84  if (!unit_nb) {
85  goto pps;
86  }
87 
/* One iteration per parameter set: first all SPS units, then (once the
 * count is reloaded at the `pps` label) all PPS units. */
88  while (unit_nb--) {
89  int err;
90 
91  /* possible overread ok due to padding */
92  unit_size = bytestream2_get_be16u(gb);
/* Each unit grows the output by its payload plus a 4-byte start code. */
93  total_size += unit_size + 4;
94  av_assert1(total_size <= INT_MAX - padding);
/* While SPS units are still being read (sps_done == 0) one extra byte is
 * required, matching the PPS count byte read after the last SPS. */
95  if (bytestream2_get_bytes_left(gb) < unit_size + !sps_done) {
96  av_log(ctx, AV_LOG_ERROR, "Global extradata truncated, "
97  "corrupted stream or invalid MP4/AVCC bitstream\n");
98  av_free(out);
99  return AVERROR_INVALIDDATA;
100  }
101  if ((err = av_reallocp(&out, total_size + padding)) < 0)
102  return err;
/* Write the start code, then the unit payload right behind it. */
103  memcpy(out + total_size - unit_size - 4, nalu_header, 4);
104  bytestream2_get_bufferu(gb, out + total_size - unit_size, unit_size);
105 pps:
/* After the last SPS (or immediately, if there were none) load the PPS
 * count exactly once and remember where the PPS data starts. */
106  if (!unit_nb && !sps_done++) {
107  unit_nb = bytestream2_get_byteu(gb); /* number of pps unit(s) */
108  pps_offset = total_size;
109  }
110  }
111 
/* Zero the padding that follows the converted data. */
112  if (out)
113  memset(out + total_size, 0, padding);
114 
/* pps_offset is nonzero only if at least one SPS was converted. */
115  if (pps_offset) {
116  s->sps = out;
117  s->sps_size = pps_offset;
118  } else {
/* NOTE(review): listing line 119, the call that takes this message, is
 * missing from this listing. */
120  "Warning: SPS NALU missing or invalid. "
121  "The resulting stream may not play.\n");
122  }
/* Any bytes past pps_offset are converted PPS data. */
123  if (pps_offset < total_size) {
124  s->pps = out + pps_offset;
125  s->pps_size = total_size - pps_offset;
126  } else {
/* NOTE(review): listing line 127, the call that takes this message, is
 * missing from this listing. */
128  "Warning: PPS NALU missing or invalid. "
129  "The resulting stream may not play.\n");
130  }
131 
/* Replace any previous output extradata with the converted buffer. */
132  av_freep(&ctx->par_out->extradata);
133  ctx->par_out->extradata = out;
134  ctx->par_out->extradata_size = total_size;
135 
136  return length_size;
137 }
138 
/*
 * Body of the init callback. The signature line is missing from this
 * listing; the index at the end of the page gives it as
 * h264_mp4toannexb_init(AVBSFContext *ctx).
 *
 * Three cases, decided by the input extradata:
 *   - empty, or starting with 00 00 01 / 00 00 00 01: nothing is set up;
 *   - at least 7 bytes: the filter state is initialised from `ret`;
 *   - anything else: AVERROR_INVALIDDATA.
 *
 * Returns 0 on success or a negative error code.
 *
 * NOTE(review): listing lines 141, 149 and 152 are missing. `s` and the
 * assignment to `ret` are therefore not visible - presumably `ret` is the
 * result of h264_extradata_to_annexb(); confirm against the real file.
 */
140 {
142  int extra_size = ctx->par_in->extradata_size;
143  int ret;
144 
145  /* retrieve sps and pps NAL units from extradata */
146  if (!extra_size ||
147  (extra_size >= 3 && AV_RB24(ctx->par_in->extradata) == 1) ||
148  (extra_size >= 4 && AV_RB32(ctx->par_in->extradata) == 1)) {
150  "The input looks like it is Annex B already\n");
151  } else if (extra_size >= 7) {
153  if (ret < 0)
154  return ret;
155 
/* A non-negative ret is stored as the NAL length prefix size. */
156  s->length_size = ret;
157  s->new_idr = 1;
158  s->idr_sps_seen = 0;
159  s->idr_pps_seen = 0;
/* Packets are only rewritten by the filter callback once this is set. */
160  s->extradata_parsed = 1;
161  } else {
162  av_log(ctx, AV_LOG_ERROR, "Invalid extradata size: %d\n", extra_size);
163  return AVERROR_INVALIDDATA;
164  }
165 
166  return 0;
167 }
168 
/*
 * Body of the filter callback. The signature line is missing from this
 * listing; the index at the end of the page gives it as
 * h264_mp4toannexb_filter(AVBSFContext *ctx, AVPacket *opkt).
 *
 * Fetches one input packet and, if extradata was parsed at init time,
 * rewrites it: every length-prefixed NAL unit is emitted with a start code
 * instead, and stored SPS/PPS data is inserted where the stream itself does
 * not carry it. If no extradata was parsed the packet is passed through
 * unchanged.
 *
 * The packet is walked twice: pass j == 0 only computes the output size,
 * then the output packet is allocated, and pass j == 1 writes the bytes.
 *
 * Returns 0 on success or a negative error code; the input packet is
 * always freed.
 *
 * NOTE(review): listing line 171 is missing, so the declaration of `s` is
 * not visible - presumably the filter's H264BSFContext.
 */
170 {
172  AVPacket *in;
173  uint8_t unit_type, new_idr, sps_seen, pps_seen;
174  const uint8_t *buf;
175  const uint8_t *buf_end;
176  uint8_t *out;
177  uint64_t out_size;
178  int ret;
179 
180  ret = ff_bsf_get_packet(ctx, &in);
181  if (ret < 0)
182  return ret;
183 
184  /* nothing to filter */
185  if (!s->extradata_parsed) {
186  av_packet_move_ref(opkt, in);
187  av_packet_free(&in);
188  return 0;
189  }
190 
191  buf_end = in->data + in->size;
192 
/* LOG_ONCE only logs when j is nonzero, i.e. during the second pass, so a
 * message is not repeated for both passes over the same packet. */
193 #define LOG_ONCE(...) \
194  if (j) \
195  av_log(__VA_ARGS__)
196  for (int j = 0; j < 2; j++) {
/* Both passes restart from the same packet position and the same saved
 * state so that they take identical decisions. */
197  buf = in->data;
198  new_idr = s->new_idr;
199  sps_seen = s->idr_sps_seen;
200  pps_seen = s->idr_pps_seen;
201  out_size = 0;
202 
203  do {
204  uint32_t nal_size = 0;
205 
206  /* possible overread ok due to padding */
207  for (int i = 0; i < s->length_size; i++)
208  nal_size = (nal_size << 8) | buf[i];
209 
210  buf += s->length_size;
211 
212  /* This check requires the cast as the right side might
213  * otherwise be promoted to an unsigned value. */
214  if ((int64_t)nal_size > buf_end - buf) {
/* NOTE(review): listing line 215 is missing. On the visible lines `ret` is
 * still 0 here - confirm the missing line sets an error code before the
 * jump. */
216  goto fail;
217  }
218 
/* Zero-sized units produce no output. */
219  if (!nal_size)
220  continue;
221 
222  unit_type = *buf & 0x1f;
223 
224  if (unit_type == H264_NAL_SPS) {
225  sps_seen = new_idr = 1;
226  } else if (unit_type == H264_NAL_PPS) {
227  pps_seen = new_idr = 1;
228  /* if SPS has not been seen yet, prepend the AVCC one to PPS */
229  if (!sps_seen) {
230  if (!s->sps_size) {
231  LOG_ONCE(ctx, AV_LOG_WARNING, "SPS not present in the stream, nor in AVCC, stream may be unreadable\n");
232  } else {
/* ps == -1: the stored data is emitted without an additional start code. */
233  count_or_copy(&out, &out_size, s->sps, s->sps_size, -1, j);
234  sps_seen = 1;
235  }
236  }
237  }
238 
239  /* If this is a new IDR picture following an IDR picture, reset the idr flag.
240  * Just check first_mb_in_slice to be 0 as this is the simplest solution.
241  * This could be checking idr_pic_id instead, but would complexify the parsing. */
242  if (!new_idr && unit_type == H264_NAL_IDR_SLICE && (buf[1] & 0x80))
243  new_idr = 1;
244 
245  /* prepend only to the first type 5 NAL unit of an IDR picture, if no sps/pps are already present */
246  if (new_idr && unit_type == H264_NAL_IDR_SLICE && !sps_seen && !pps_seen) {
247  if (ctx->par_out->extradata)
248  count_or_copy(&out, &out_size, ctx->par_out->extradata,
249  ctx->par_out->extradata_size, -1, j);
250  new_idr = 0;
251  /* if only SPS has been seen, also insert PPS */
252  } else if (new_idr && unit_type == H264_NAL_IDR_SLICE && sps_seen && !pps_seen) {
253  if (!s->pps_size) {
254  LOG_ONCE(ctx, AV_LOG_WARNING, "PPS not present in the stream, nor in AVCC, stream may be unreadable\n");
255  } else {
256  count_or_copy(&out, &out_size, s->pps, s->pps_size, -1, j);
257  }
258  }
259 
/* Emit the unit itself; SPS and PPS units pass ps == 1, all others 0. */
260  count_or_copy(&out, &out_size, buf, nal_size,
261  unit_type == H264_NAL_SPS || unit_type == H264_NAL_PPS, j);
/* An H264_NAL_SLICE unit seen while new_idr is clear sets new_idr again
 * and clears both "seen" flags. */
262  if (!new_idr && unit_type == H264_NAL_SLICE) {
263  new_idr = 1;
264  sps_seen = 0;
265  pps_seen = 0;
266  }
267 
268  buf += nal_size;
269  } while (buf < buf_end);
270 
/* End of the counting pass: allocate the output packet with the size just
 * computed and point the write cursor at its data. */
271  if (!j) {
272  if (out_size > INT_MAX - AV_INPUT_BUFFER_PADDING_SIZE) {
/* NOTE(review): listing line 273 is missing. On the visible lines `ret` is
 * still 0 here - confirm the missing line sets an error code before the
 * jump. */
274  goto fail;
275  }
276  ret = av_new_packet(opkt, out_size);
277  if (ret < 0)
278  goto fail;
279  out = opkt->data;
280  }
281  }
282 #undef LOG_ONCE
283 
284  av_assert1(out_size == opkt->size);
285 
/* Store the state back only after both passes have completed. */
286  s->new_idr = new_idr;
287  s->idr_sps_seen = sps_seen;
288  s->idr_pps_seen = pps_seen;
289 
290  ret = av_packet_copy_props(opkt, in);
291  if (ret < 0)
292  goto fail;
293 
/* Also reached on success: the output is only discarded when ret < 0. */
294 fail:
295  if (ret < 0)
296  av_packet_unref(opkt);
297  av_packet_free(&in);
298 
299  return ret;
300 }
301 
/*
 * Body of the flush callback. The signature line is missing from this
 * listing; the index at the end of the page gives it as
 * h264_mp4toannexb_flush(AVBSFContext *ctx).
 *
 * Clears both "seen" flags and sets new_idr to the value of
 * extradata_parsed, the same state the init callback leaves when extradata
 * was parsed.
 *
 * NOTE(review): listing line 304 is missing, so the declaration of `s` is
 * not visible - presumably the filter's H264BSFContext.
 */
303 {
305 
306  s->idr_sps_seen = 0;
307  s->idr_pps_seen = 0;
308  s->new_idr = s->extradata_parsed;
309 }
310 
/*
 * Codec ID list referenced by the filter descriptor's .codec_ids member.
 * NOTE(review): the initializer line (listing line 312) is missing here;
 * the index at the end of the page references AV_CODEC_ID_H264 and
 * AV_CODEC_ID_NONE, which are presumably its entries - confirm.
 */
311 static const enum AVCodecID codec_ids[] = {
313 };
314 
/*
 * Filter descriptor. Its opening line (listing line 315) and listing lines
 * 318-320 are missing from this listing; the index at the end of the page
 * gives the declaration as `const AVBitStreamFilter ff_h264_mp4toannexb_bsf`.
 */
316  .name = "h264_mp4toannexb",
/* Size of the per-instance private state. */
317  .priv_data_size = sizeof(H264BSFContext),
321  .codec_ids = codec_ids,
322 };
av_packet_unref
void av_packet_unref(AVPacket *pkt)
Wipe the packet.
Definition: avpacket.c:424
AV_LOG_WARNING
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:186
H264_NAL_IDR_SLICE
@ H264_NAL_IDR_SLICE
Definition: h264.h:39
bsf_internal.h
out
FILE * out
Definition: movenc.c:54
GetByteContext
Definition: bytestream.h:33
H264BSFContext::sps
uint8_t * sps
Definition: h264_mp4toannexb_bsf.c:35
bytestream2_skipu
static av_always_inline void bytestream2_skipu(GetByteContext *g, unsigned int size)
Definition: bytestream.h:174
AVBitStreamFilter::name
const char * name
Definition: bsf.h:91
out_size
int out_size
Definition: movenc.c:55
AVPacket::data
uint8_t * data
Definition: packet.h:373
h264_mp4toannexb_filter
static int h264_mp4toannexb_filter(AVBSFContext *ctx, AVPacket *opkt)
Definition: h264_mp4toannexb_bsf.c:169
AV_LOG_VERBOSE
#define AV_LOG_VERBOSE
Detailed information.
Definition: log.h:196
H264BSFContext::extradata_parsed
int extradata_parsed
Definition: h264_mp4toannexb_bsf.c:43
filter
filter_frame: For filters that do not use the activate() callback, this method is called when a frame is pushed to the filter's input. It can be called at any time except in a reentrant way. If the input frame is enough to produce output, then the filter should push the output frames on the output link immediately. As an exception to the previous rule, if the input frame is enough to produce several output frames, then the filter needs to output only at least one per link. The additional frames can be left buffered in the filter.
Definition: filter_design.txt:228
ff_bsf_get_packet
int ff_bsf_get_packet(AVBSFContext *ctx, AVPacket **pkt)
Called by the bitstream filters to get the next packet for filtering.
Definition: bsf.c:231
av_packet_free
void av_packet_free(AVPacket **pkt)
Free the packet, if the packet is reference counted, it will be unreferenced first.
Definition: avpacket.c:75
AVBSFContext
The bitstream filter state.
Definition: bsf.h:47
init
static int init
Definition: av_tx.c:47
bsf.h
h264_mp4toannexb_flush
static void h264_mp4toannexb_flush(AVBSFContext *ctx)
Definition: h264_mp4toannexb_bsf.c:302
H264BSFContext::idr_sps_seen
uint8_t idr_sps_seen
Definition: h264_mp4toannexb_bsf.c:41
fail
#define fail()
Definition: checkasm.h:127
avassert.h
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
H264_NAL_PPS
@ H264_NAL_PPS
Definition: h264.h:42
H264BSFContext::pps_size
int pps_size
Definition: h264_mp4toannexb_bsf.c:38
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:257
av_new_packet
int av_new_packet(AVPacket *pkt, int size)
Allocate the payload of a packet and initialize its fields with default values.
Definition: avpacket.c:99
codec_ids
static enum AVCodecID codec_ids[]
Definition: h264_mp4toannexb_bsf.c:311
ctx
AVFormatContext * ctx
Definition: movenc.c:48
H264BSFContext
Definition: h264_mp4toannexb_bsf.c:34
AV_CODEC_ID_H264
@ AV_CODEC_ID_H264
Definition: codec_id.h:77
flush
static void flush(AVCodecContext *avctx)
Definition: aacdec_template.c:593
NULL
#define NULL
Definition: coverity.c:32
ff_h264_mp4toannexb_bsf
const AVBitStreamFilter ff_h264_mp4toannexb_bsf
Definition: h264_mp4toannexb_bsf.c:315
av_packet_move_ref
void av_packet_move_ref(AVPacket *dst, AVPacket *src)
Move every field in src to dst and reset src.
Definition: avpacket.c:481
bytestream2_get_bytes_left
static av_always_inline int bytestream2_get_bytes_left(GetByteContext *g)
Definition: bytestream.h:158
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:47
AV_WB32
#define AV_WB32(p, v)
Definition: intreadwrite.h:419
AVPacket::size
int size
Definition: packet.h:374
copy
static void copy(const float *p1, float *p2, const int length)
Definition: vf_vaguedenoiser.c:187
pps
static int FUNC() pps(CodedBitstreamContext *ctx, RWContext *rw, H264RawPPS *current)
Definition: cbs_h264_syntax_template.c:404
av_reallocp
int av_reallocp(void *ptr, size_t size)
Allocate, reallocate, or free a block of memory through a pointer to a pointer.
Definition: mem.c:185
AV_RB32
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_WB64 unsigned int_TMPL AV_RB32
Definition: bytestream.h:96
h264_mp4toannexb_init
static int h264_mp4toannexb_init(AVBSFContext *ctx)
Definition: h264_mp4toannexb_bsf.c:139
H264_NAL_SPS
@ H264_NAL_SPS
Definition: h264.h:41
av_packet_copy_props
int av_packet_copy_props(AVPacket *dst, const AVPacket *src)
Copy only "properties" fields from src to dst.
Definition: avpacket.c:387
AV_CODEC_ID_NONE
@ AV_CODEC_ID_NONE
Definition: codec_id.h:48
i
#define i(width, name, range_min, range_max)
Definition: cbs_h2645.c:271
H264_NAL_SLICE
@ H264_NAL_SLICE
Definition: h264.h:35
H264BSFContext::length_size
uint8_t length_size
Definition: h264_mp4toannexb_bsf.c:39
av_assert1
#define av_assert1(cond)
assert() equivalent, that does not lie in speed critical code.
Definition: avassert.h:53
count_or_copy
static void count_or_copy(uint8_t **out, uint64_t *out_size, const uint8_t *in, int in_size, int ps, int copy)
Definition: h264_mp4toannexb_bsf.c:46
H264BSFContext::new_idr
uint8_t new_idr
Definition: h264_mp4toannexb_bsf.c:40
ret
ret
Definition: filter_design.txt:187
H264BSFContext::pps
uint8_t * pps
Definition: h264_mp4toannexb_bsf.c:36
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
LOG_ONCE
#define LOG_ONCE(...)
AVBitStreamFilter
Definition: bsf.h:90
defs.h
mem.h
bytestream2_get_bufferu
static av_always_inline unsigned int bytestream2_get_bufferu(GetByteContext *g, uint8_t *dst, unsigned int size)
Definition: bytestream.h:277
h264_extradata_to_annexb
static int h264_extradata_to_annexb(AVBSFContext *ctx, const int padding)
Definition: h264_mp4toannexb_bsf.c:65
av_free
#define av_free(p)
Definition: tableprint_vlc.h:34
AVPacket
This structure stores compressed data.
Definition: packet.h:350
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35
bytestream.h
h264.h
bytestream2_init
static av_always_inline void bytestream2_init(GetByteContext *g, const uint8_t *buf, int buf_size)
Definition: bytestream.h:137
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
AV_RB24
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_WB64 unsigned int_TMPL AV_WB32 unsigned int_TMPL AV_RB24
Definition: bytestream.h:97
H264BSFContext::sps_size
int sps_size
Definition: h264_mp4toannexb_bsf.c:37
AVFormatContext::priv_data
void * priv_data
Format private data.
Definition: avformat.h:1228
H264BSFContext::idr_pps_seen
uint8_t idr_pps_seen
Definition: h264_mp4toannexb_bsf.c:42