FFmpeg  4.0
h264_mp4toannexb_bsf.c
Go to the documentation of this file.
1 /*
2  * H.264 MP4 to Annex B byte stream format filter
3  * Copyright (c) 2007 Benoit Fouet <benoit.fouet@free.fr>
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include <string.h>
23 
24 #include "libavutil/intreadwrite.h"
25 #include "libavutil/mem.h"
26 
27 #include "avcodec.h"
28 #include "bsf.h"
29 
30 typedef struct H264BSFContext {
39 
41  const uint8_t *sps_pps, uint32_t sps_pps_size,
42  const uint8_t *in, uint32_t in_size, int ps)
43 {
44  uint32_t offset = out->size;
45  uint8_t start_code_size = offset == 0 || ps ? 4 : 3;
46  int err;
47 
48  err = av_grow_packet(out, sps_pps_size + in_size + start_code_size);
49  if (err < 0)
50  return err;
51 
52  if (sps_pps)
53  memcpy(out->data + offset, sps_pps, sps_pps_size);
54  memcpy(out->data + sps_pps_size + start_code_size + offset, in, in_size);
55  if (start_code_size == 4) {
56  AV_WB32(out->data + offset + sps_pps_size, 1);
57  } else {
58  (out->data + offset + sps_pps_size)[0] =
59  (out->data + offset + sps_pps_size)[1] = 0;
60  (out->data + offset + sps_pps_size)[2] = 1;
61  }
62 
63  return 0;
64 }
65 
66 static int h264_extradata_to_annexb(AVBSFContext *ctx, const int padding)
67 {
68  H264BSFContext *s = ctx->priv_data;
69  uint16_t unit_size;
70  uint64_t total_size = 0;
71  uint8_t *out = NULL, unit_nb, sps_done = 0,
72  sps_seen = 0, pps_seen = 0;
73  const uint8_t *extradata = ctx->par_in->extradata + 4;
74  static const uint8_t nalu_header[4] = { 0, 0, 0, 1 };
75  int length_size = (*extradata++ & 0x3) + 1; // retrieve length coded size
76 
77  s->sps_offset = s->pps_offset = -1;
78 
79  /* retrieve sps and pps unit(s) */
80  unit_nb = *extradata++ & 0x1f; /* number of sps unit(s) */
81  if (!unit_nb) {
82  goto pps;
83  } else {
84  s->sps_offset = 0;
85  sps_seen = 1;
86  }
87 
88  while (unit_nb--) {
89  int err;
90 
91  unit_size = AV_RB16(extradata);
92  total_size += unit_size + 4;
93  if (total_size > INT_MAX - padding) {
94  av_log(ctx, AV_LOG_ERROR,
95  "Too big extradata size, corrupted stream or invalid MP4/AVCC bitstream\n");
96  av_free(out);
97  return AVERROR(EINVAL);
98  }
99  if (extradata + 2 + unit_size > ctx->par_in->extradata + ctx->par_in->extradata_size) {
100  av_log(ctx, AV_LOG_ERROR, "Packet header is not contained in global extradata, "
101  "corrupted stream or invalid MP4/AVCC bitstream\n");
102  av_free(out);
103  return AVERROR(EINVAL);
104  }
105  if ((err = av_reallocp(&out, total_size + padding)) < 0)
106  return err;
107  memcpy(out + total_size - unit_size - 4, nalu_header, 4);
108  memcpy(out + total_size - unit_size, extradata + 2, unit_size);
109  extradata += 2 + unit_size;
110 pps:
111  if (!unit_nb && !sps_done++) {
112  unit_nb = *extradata++; /* number of pps unit(s) */
113  if (unit_nb) {
114  s->pps_offset = total_size;
115  pps_seen = 1;
116  }
117  }
118  }
119 
120  if (out)
121  memset(out + total_size, 0, padding);
122 
123  if (!sps_seen)
124  av_log(ctx, AV_LOG_WARNING,
125  "Warning: SPS NALU missing or invalid. "
126  "The resulting stream may not play.\n");
127 
128  if (!pps_seen)
129  av_log(ctx, AV_LOG_WARNING,
130  "Warning: PPS NALU missing or invalid. "
131  "The resulting stream may not play.\n");
132 
133  av_freep(&ctx->par_out->extradata);
134  ctx->par_out->extradata = out;
135  ctx->par_out->extradata_size = total_size;
136 
137  return length_size;
138 }
139 
141 {
142  H264BSFContext *s = ctx->priv_data;
143  int extra_size = ctx->par_in->extradata_size;
144  int ret;
145 
146  /* retrieve sps and pps NAL units from extradata */
147  if (!extra_size ||
148  (extra_size >= 3 && AV_RB24(ctx->par_in->extradata) == 1) ||
149  (extra_size >= 4 && AV_RB32(ctx->par_in->extradata) == 1)) {
150  av_log(ctx, AV_LOG_VERBOSE,
151  "The input looks like it is Annex B already\n");
152  } else if (extra_size >= 6) {
154  if (ret < 0)
155  return ret;
156 
157  s->length_size = ret;
158  s->new_idr = 1;
159  s->idr_sps_seen = 0;
160  s->idr_pps_seen = 0;
161  s->extradata_parsed = 1;
162  } else {
163  av_log(ctx, AV_LOG_ERROR, "Invalid extradata size: %d\n", extra_size);
164  return AVERROR_INVALIDDATA;
165  }
166 
167  return 0;
168 }
169 
171 {
172  H264BSFContext *s = ctx->priv_data;
173 
174  AVPacket *in;
175  uint8_t unit_type;
176  int32_t nal_size;
177  uint32_t cumul_size = 0;
178  const uint8_t *buf;
179  const uint8_t *buf_end;
180  int buf_size;
181  int ret = 0, i;
182 
183  ret = ff_bsf_get_packet(ctx, &in);
184  if (ret < 0)
185  return ret;
186 
187  /* nothing to filter */
188  if (!s->extradata_parsed) {
189  av_packet_move_ref(out, in);
190  av_packet_free(&in);
191  return 0;
192  }
193 
194  buf = in->data;
195  buf_size = in->size;
196  buf_end = in->data + in->size;
197 
198  do {
199  ret= AVERROR(EINVAL);
200  if (buf + s->length_size > buf_end)
201  goto fail;
202 
203  for (nal_size = 0, i = 0; i<s->length_size; i++)
204  nal_size = (nal_size << 8) | buf[i];
205 
206  buf += s->length_size;
207  unit_type = *buf & 0x1f;
208 
209  if (nal_size > buf_end - buf || nal_size < 0)
210  goto fail;
211 
212  if (unit_type == 7)
213  s->idr_sps_seen = s->new_idr = 1;
214  else if (unit_type == 8) {
215  s->idr_pps_seen = s->new_idr = 1;
216  /* if SPS has not been seen yet, prepend the AVCC one to PPS */
217  if (!s->idr_sps_seen) {
218  if (s->sps_offset == -1)
219  av_log(ctx, AV_LOG_WARNING, "SPS not present in the stream, nor in AVCC, stream may be unreadable\n");
220  else {
221  if ((ret = alloc_and_copy(out,
222  ctx->par_out->extradata + s->sps_offset,
223  s->pps_offset != -1 ? s->pps_offset : ctx->par_out->extradata_size - s->sps_offset,
224  buf, nal_size, 1)) < 0)
225  goto fail;
226  s->idr_sps_seen = 1;
227  goto next_nal;
228  }
229  }
230  }
231 
232  /* if this is a new IDR picture following an IDR picture, reset the idr flag.
233  * Just check first_mb_in_slice to be 0 as this is the simplest solution.
234  * This could be checking idr_pic_id instead, but would complexify the parsing. */
235  if (!s->new_idr && unit_type == 5 && (buf[1] & 0x80))
236  s->new_idr = 1;
237 
238  /* prepend only to the first type 5 NAL unit of an IDR picture, if no sps/pps are already present */
239  if (s->new_idr && unit_type == 5 && !s->idr_sps_seen && !s->idr_pps_seen) {
240  if ((ret=alloc_and_copy(out,
242  buf, nal_size, 1)) < 0)
243  goto fail;
244  s->new_idr = 0;
245  /* if only SPS has been seen, also insert PPS */
246  } else if (s->new_idr && unit_type == 5 && s->idr_sps_seen && !s->idr_pps_seen) {
247  if (s->pps_offset == -1) {
248  av_log(ctx, AV_LOG_WARNING, "PPS not present in the stream, nor in AVCC, stream may be unreadable\n");
249  if ((ret = alloc_and_copy(out, NULL, 0, buf, nal_size, 0)) < 0)
250  goto fail;
251  } else if ((ret = alloc_and_copy(out,
253  buf, nal_size, 1)) < 0)
254  goto fail;
255  } else {
256  if ((ret=alloc_and_copy(out, NULL, 0, buf, nal_size, unit_type == 7 || unit_type == 8)) < 0)
257  goto fail;
258  if (!s->new_idr && unit_type == 1) {
259  s->new_idr = 1;
260  s->idr_sps_seen = 0;
261  s->idr_pps_seen = 0;
262  }
263  }
264 
265 next_nal:
266  buf += nal_size;
267  cumul_size += nal_size + s->length_size;
268  } while (cumul_size < buf_size);
269 
270  ret = av_packet_copy_props(out, in);
271  if (ret < 0)
272  goto fail;
273 
274 fail:
275  if (ret < 0)
276  av_packet_unref(out);
277  av_packet_free(&in);
278 
279  return ret;
280 }
281 
282 static const enum AVCodecID codec_ids[] = {
284 };
285 
287  .name = "h264_mp4toannexb",
288  .priv_data_size = sizeof(H264BSFContext),
291  .codec_ids = codec_ids,
292 };
#define NULL
Definition: coverity.c:32
const char * s
Definition: avisynth_c.h:768
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
AVCodecParameters * par_out
Parameters of the output stream.
Definition: avcodec.h:5721
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:182
Memory handling functions.
static av_cold int init(AVCodecContext *avctx)
Definition: avrndec.c:35
The bitstream filter state.
Definition: avcodec.h:5687
int size
Definition: avcodec.h:1431
#define AV_RB24
Definition: intreadwrite.h:64
static int h264_mp4toannexb_init(AVBSFContext *ctx)
void * priv_data
Opaque filter-specific private data.
Definition: avcodec.h:5708
static void filter(int16_t *output, ptrdiff_t out_stride, int16_t *low, ptrdiff_t low_stride, int16_t *high, ptrdiff_t high_stride, int len, int clip)
Definition: cfhd.c:114
void av_packet_free(AVPacket **pkt)
Free the packet, if the packet is reference counted, it will be unreferenced first.
Definition: avpacket.c:62
uint8_t
#define AV_RB32
Definition: intreadwrite.h:130
const char * name
Definition: avcodec.h:5737
uint8_t * data
Definition: avcodec.h:1430
void av_packet_move_ref(AVPacket *dst, AVPacket *src)
Move every field in src to dst and reset src.
Definition: avpacket.c:647
static int h264_extradata_to_annexb(AVBSFContext *ctx, const int padding)
#define AV_LOG_VERBOSE
Detailed information.
Definition: log.h:192
#define av_log(a,...)
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: avcodec.h:215
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:176
#define AV_RB16
Definition: intreadwrite.h:53
#define AVERROR(e)
Definition: error.h:43
static const uint8_t offset[127][2]
Definition: vf_spp.c:92
#define fail()
Definition: checkasm.h:116
int extradata_size
Size of the extradata content in bytes.
Definition: avcodec.h:3902
int av_packet_copy_props(AVPacket *dst, const AVPacket *src)
Copy only "properties" fields from src to dst.
Definition: avpacket.c:558
int32_t
AVFormatContext * ctx
Definition: movenc.c:48
static int alloc_and_copy(AVPacket *out, const uint8_t *sps_pps, uint32_t sps_pps_size, const uint8_t *in, uint32_t in_size, int ps)
static int h264_mp4toannexb_filter(AVBSFContext *ctx, AVPacket *out)
int av_reallocp(void *ptr, size_t size)
Allocate, reallocate, or free a block of memory through a pointer to a pointer.
Definition: mem.c:163
Libavcodec external API header.
void av_packet_unref(AVPacket *pkt)
Wipe the packet.
Definition: avpacket.c:592
void * buf
Definition: avisynth_c.h:690
uint8_t pi<< 24) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0f/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_U8, uint8_t,(*(const uint8_t *) pi - 0x80) *(1.0/(1<< 7))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S16, int16_t,(*(const int16_t *) pi >> 8)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0f/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S16, int16_t, *(const int16_t *) pi *(1.0/(1<< 15))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_S32, int32_t,(*(const int32_t *) pi >> 24)+0x80) CONV_FUNC_GROUP(AV_SAMPLE_FMT_FLT, float, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0f/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_DBL, double, AV_SAMPLE_FMT_S32, int32_t, *(const int32_t *) pi *(1.0/(1U<< 31))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_FLT, float, av_clip_uint8(lrintf(*(const float *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_FLT, float, av_clip_int16(lrintf(*(const float *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_FLT, float, av_clipl_int32(llrintf(*(const float *) pi *(1U<< 31)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_U8, uint8_t, AV_SAMPLE_FMT_DBL, double, av_clip_uint8(lrint(*(const double *) pi *(1<< 7))+0x80)) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S16, int16_t, AV_SAMPLE_FMT_DBL, double, av_clip_int16(lrint(*(const double *) pi *(1<< 15)))) CONV_FUNC_GROUP(AV_SAMPLE_FMT_S32, int32_t, AV_SAMPLE_FMT_DBL, double, av_clipl_int32(llrint(*(const double *) pi *(1U<< 31)))) #define SET_CONV_FUNC_GROUP(ofmt, ifmt) static void set_generic_function(AudioConvert *ac) { } void ff_audio_convert_free(AudioConvert **ac) { if(! *ac) return;ff_dither_free(&(*ac) ->dc);av_freep(ac);} AudioConvert *ff_audio_convert_alloc(AVAudioResampleContext *avr, enum AVSampleFormat out_fmt, enum AVSampleFormat in_fmt, int channels, int sample_rate, int apply_map) { AudioConvert *ac;int in_planar, out_planar;ac=av_mallocz(sizeof(*ac));if(!ac) return NULL;ac->avr=avr;ac->out_fmt=out_fmt;ac->in_fmt=in_fmt;ac->channels=channels;ac->apply_map=apply_map;if(avr->dither_method !=AV_RESAMPLE_DITHER_NONE &&av_get_packed_sample_fmt(out_fmt)==AV_SAMPLE_FMT_S16 &&av_get_bytes_per_sample(in_fmt) > 2) { ac->dc=ff_dither_alloc(avr, out_fmt, in_fmt, channels, sample_rate, apply_map);if(!ac->dc) { av_free(ac);return NULL;} return ac;} in_planar=ff_sample_fmt_is_planar(in_fmt, channels);out_planar=ff_sample_fmt_is_planar(out_fmt, channels);if(in_planar==out_planar) { ac->func_type=CONV_FUNC_TYPE_FLAT;ac->planes=in_planar ? ac->channels :1;} else if(in_planar) ac->func_type=CONV_FUNC_TYPE_INTERLEAVE;else ac->func_type=CONV_FUNC_TYPE_DEINTERLEAVE;set_generic_function(ac);if(ARCH_AARCH64) ff_audio_convert_init_aarch64(ac);if(ARCH_ARM) ff_audio_convert_init_arm(ac);if(ARCH_X86) ff_audio_convert_init_x86(ac);return ac;} int ff_audio_convert(AudioConvert *ac, AudioData *out, AudioData *in) { int use_generic=1;int len=in->nb_samples;int p;if(ac->dc) { av_log(ac->avr, AV_LOG_TRACE, "%d samples - audio_convert: %s to %s (dithered)\", len, av_get_sample_fmt_name(ac->in_fmt), av_get_sample_fmt_name(ac->out_fmt));return ff_convert_dither(ac-> in
static int FUNC() pps(CodedBitstreamContext *ctx, RWContext *rw, H264RawPPS *current)
#define AV_WB32(p, v)
Definition: intreadwrite.h:419
static enum AVCodecID codec_ids[]
int ff_bsf_get_packet(AVBSFContext *ctx, AVPacket **pkt)
Called by the bitstream filters to get the next packet for filtering.
Definition: bsf.c:206
int av_grow_packet(AVPacket *pkt, int grow_by)
Increase packet size, correctly zeroing padding.
Definition: avpacket.c:109
#define AV_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding...
Definition: avcodec.h:773
const AVBitStreamFilter ff_h264_mp4toannexb_bsf
#define av_free(p)
uint8_t * extradata
Extra binary data needed for initializing the decoder, codec-dependent.
Definition: avcodec.h:3898
FILE * out
Definition: movenc.c:54
#define av_freep(p)
This structure stores compressed data.
Definition: avcodec.h:1407
AVCodecParameters * par_in
Parameters of the input stream.
Definition: avcodec.h:5715