FFmpeg
flac_picture.c
Go to the documentation of this file.
1 /*
2  * Raw FLAC picture parser
3  * Copyright (c) 2001 Fabrice Bellard
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include "libavutil/intreadwrite.h"
23 #include "libavcodec/bytestream.h"
24 #include "libavcodec/png.h"
25 #include "avformat.h"
26 #include "flac_picture.h"
27 #include "id3v2.h"
28 #include "internal.h"
29 
/* Upper bound, in bytes (500 MiB), on an attached picture's declared size. */
#define MAX_TRUNC_PICTURE_SIZE (500 * 1024 * 1024)
31 
32 int ff_flac_parse_picture(AVFormatContext *s, uint8_t **bufp, int buf_size,
33  int truncate_workaround)
34 {
35  const CodecMime *mime = ff_id3v2_mime_tags;
36  enum AVCodecID id = AV_CODEC_ID_NONE;
38  uint8_t mimetype[64], *buf = *bufp;
39  const uint8_t *desc = NULL;
41  AVStream *st;
42  int width, height, ret = 0;
43  unsigned int type;
44  uint32_t len, left, trunclen = 0;
45 
46  if (buf_size < 34) {
47  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
48  if (s->error_recognition & AV_EF_EXPLODE)
49  return AVERROR_INVALIDDATA;
50  return 0;
51  }
52 
53  bytestream2_init(&g, buf, buf_size);
54 
55  /* read the picture type */
56  type = bytestream2_get_be32u(&g);
58  av_log(s, AV_LOG_ERROR, "Invalid picture type: %d.\n", type);
59  if (s->error_recognition & AV_EF_EXPLODE) {
60  return AVERROR_INVALIDDATA;
61  }
62  type = 0;
63  }
64 
65  /* picture mimetype */
66  len = bytestream2_get_be32u(&g);
67  if (len <= 0 || len >= sizeof(mimetype)) {
68  av_log(s, AV_LOG_ERROR, "Could not read mimetype from an attached "
69  "picture.\n");
70  if (s->error_recognition & AV_EF_EXPLODE)
71  return AVERROR_INVALIDDATA;
72  return 0;
73  }
74  if (len + 24 > bytestream2_get_bytes_left(&g)) {
75  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
76  if (s->error_recognition & AV_EF_EXPLODE)
77  return AVERROR_INVALIDDATA;
78  return 0;
79  }
80  bytestream2_get_bufferu(&g, mimetype, len);
81  mimetype[len] = 0;
82 
83  while (mime->id != AV_CODEC_ID_NONE) {
84  if (!strncmp(mime->str, mimetype, sizeof(mimetype))) {
85  id = mime->id;
86  break;
87  }
88  mime++;
89  }
90  if (id == AV_CODEC_ID_NONE) {
91  av_log(s, AV_LOG_ERROR, "Unknown attached picture mimetype: %s.\n",
92  mimetype);
93  if (s->error_recognition & AV_EF_EXPLODE)
94  return AVERROR_INVALIDDATA;
95  return 0;
96  }
97 
98  /* picture description */
99  len = bytestream2_get_be32u(&g);
100  if (len > bytestream2_get_bytes_left(&g) - 20) {
101  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
102  if (s->error_recognition & AV_EF_EXPLODE)
103  return AVERROR_INVALIDDATA;
104  return 0;
105  }
106  if (len > 0) {
107  desc = g.buffer;
109  }
110 
111  /* picture metadata */
112  width = bytestream2_get_be32u(&g);
113  ((uint8_t*)g.buffer)[-4] = '\0'; // NUL-terminate desc.
114  height = bytestream2_get_be32u(&g);
115  bytestream2_skipu(&g, 8);
116 
117  /* picture data */
118  len = bytestream2_get_be32u(&g);
119 
121  if (len <= 0 || len > left) {
123  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too big %u\n", len);
124  if (s->error_recognition & AV_EF_EXPLODE)
125  return AVERROR_INVALIDDATA;
126  return 0;
127  }
128 
129  // Workaround bug for flac muxers that writs truncated metadata picture block size if
130  // the picture size do not fit in 24 bits. lavf flacenc used to have the issue and based
131  // on existing broken files other unknown flac muxers seems to truncate also.
132  if (truncate_workaround &&
133  s->strict_std_compliance <= FF_COMPLIANCE_NORMAL &&
134  len > left && (len & 0xffffff) == left) {
135  av_log(s, AV_LOG_INFO, "Correcting truncated metadata picture size from %u to %u\n", left, len);
136  trunclen = len - left;
137  } else {
138  av_log(s, AV_LOG_ERROR, "Attached picture metadata block too short\n");
139  if (s->error_recognition & AV_EF_EXPLODE)
140  return AVERROR_INVALIDDATA;
141  return 0;
142  }
143  }
144  if (trunclen == 0 && len >= buf_size - (buf_size >> 4)) {
147  if (!data)
148  return AVERROR(ENOMEM);
149  *bufp = NULL;
150  data->data += bytestream2_tell(&g);
152  } else {
154  return AVERROR(ENOMEM);
155 
156  if (trunclen == 0) {
157  bytestream2_get_bufferu(&g, data->data, len);
158  } else {
159  // If truncation was detected copy all data from block and
160  // read missing bytes not included in the block size.
162  if (avio_read(s->pb, data->data + len - trunclen, trunclen) < trunclen)
164  }
165  }
166  memset(data->data + len, 0, AV_INPUT_BUFFER_PADDING_SIZE);
167 
168  if (AV_RB64(data->data) == PNGSIG)
169  id = AV_CODEC_ID_PNG;
170 
172  if (ret < 0)
173  RETURN_ERROR(ret);
174 
175  st = s->streams[s->nb_streams - 1];
176  st->codecpar->codec_id = id;
177  st->codecpar->width = width;
178  st->codecpar->height = height;
179  av_dict_set(&st->metadata, "comment", ff_id3v2_picture_types[type], 0);
180  if (desc)
181  av_dict_set(&st->metadata, "title", desc, 0);
182 
183  return 0;
184 
185 fail:
187 
188  return ret;
189 }
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
GetByteContext
Definition: bytestream.h:33
bytestream2_skipu
static av_always_inline void bytestream2_skipu(GetByteContext *g, unsigned int size)
Definition: bytestream.h:174
id3v2.h
data
const char data[16]
Definition: mxf.c:143
CodecMime
Definition: internal.h:56
fail
#define fail()
Definition: checkasm.h:127
type
it s the only field you need to keep assuming you have a context There is some magic you don t need to care about around this just let it vf type
Definition: writing_filters.txt:86
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:180
FF_ARRAY_ELEMS
#define FF_ARRAY_ELEMS(a)
Definition: sinewin_tablegen.c:29
width
#define width
intreadwrite.h
s
#define s(width, name)
Definition: cbs_vp9.c:257
g
const char * g
Definition: vf_curves.c:117
AVCodecParameters::width
int width
Video only.
Definition: codec_par.h:126
av_buffer_default_free
void av_buffer_default_free(void *opaque, uint8_t *data)
Default free callback, which calls av_free() on the buffer data.
Definition: buffer.c:72
flac_picture.h
AV_CODEC_ID_PNG
@ AV_CODEC_ID_PNG
Definition: codec_id.h:111
AVFormatContext
Format I/O context.
Definition: avformat.h:1200
internal.h
AVStream::codecpar
AVCodecParameters * codecpar
Codec parameters associated with this stream.
Definition: avformat.h:1095
NULL
#define NULL
Definition: coverity.c:32
av_buffer_unref
void av_buffer_unref(AVBufferRef **buf)
Free a given reference and automatically free the buffer if there are no more references to it.
Definition: buffer.c:139
AVStream::metadata
AVDictionary * metadata
Definition: avformat.h:1006
AV_EF_EXPLODE
#define AV_EF_EXPLODE
abort decoding on minor error detection
Definition: avcodec.h:1335
ff_id3v2_picture_types
const char *const ff_id3v2_picture_types[21]
Definition: id3v2.c:107
ff_flac_parse_picture
int ff_flac_parse_picture(AVFormatContext *s, uint8_t **bufp, int buf_size, int truncate_workaround)
Parse a FLAC METADATA_BLOCK_PICTURE.
Definition: flac_picture.c:32
av_buffer_create
AVBufferRef * av_buffer_create(uint8_t *data, size_t size, void(*free)(void *opaque, uint8_t *data), void *opaque, int flags)
Create an AVBuffer from an existing array.
Definition: buffer.c:55
ff_id3v2_mime_tags
const CodecMime ff_id3v2_mime_tags[]
Definition: id3v2.c:131
bytestream2_get_bytes_left
static av_always_inline int bytestream2_get_bytes_left(GetByteContext *g)
Definition: bytestream.h:158
AVCodecID
AVCodecID
Identify the syntax and semantics of the bitstream.
Definition: codec_id.h:47
bytestream2_tell
static av_always_inline int bytestream2_tell(GetByteContext *g)
Definition: bytestream.h:192
id
enum AVCodecID id
Definition: extract_extradata_bsf.c:325
height
#define height
av_buffer_alloc
AVBufferRef * av_buffer_alloc(size_t size)
Allocate an AVBuffer of the given size using av_malloc().
Definition: buffer.c:77
FF_COMPLIANCE_NORMAL
#define FF_COMPLIANCE_NORMAL
Definition: avcodec.h:1283
PNGSIG
#define PNGSIG
Definition: png.h:49
AV_LOG_INFO
#define AV_LOG_INFO
Standard information.
Definition: log.h:191
RETURN_ERROR
#define RETURN_ERROR(code)
Definition: flac_picture.h:27
AV_CODEC_ID_NONE
@ AV_CODEC_ID_NONE
Definition: codec_id.h:48
AVCodecParameters::height
int height
Definition: codec_par.h:127
len
int len
Definition: vorbis_enc_data.h:426
ret
ret
Definition: filter_design.txt:187
AVStream
Stream structure.
Definition: avformat.h:935
avformat.h
AV_INPUT_BUFFER_PADDING_SIZE
#define AV_INPUT_BUFFER_PADDING_SIZE
Definition: defs.h:40
left
Tag MUST be and< 10hcoeff half pel interpolation filter coefficients, hcoeff[0] are the 2 middle coefficients[1] are the next outer ones and so on, resulting in a filter like:...eff[2], hcoeff[1], hcoeff[0], hcoeff[0], hcoeff[1], hcoeff[2] ... the sign of the coefficients is not explicitly stored but alternates after each coeff and coeff[0] is positive, so ...,+,-,+,-,+,+,-,+,-,+,... hcoeff[0] is not explicitly stored but found by subtracting the sum of all stored coefficients with signs from 32 hcoeff[0]=32 - hcoeff[1] - hcoeff[2] - ... a good choice for hcoeff and htaps is htaps=6 hcoeff={40,-10, 2} an alternative which requires more computations at both encoder and decoder side and may or may not be better is htaps=8 hcoeff={42,-14, 6,-2}ref_frames minimum of the number of available reference frames and max_ref_frames for example the first frame after a key frame always has ref_frames=1spatial_decomposition_type wavelet type 0 is a 9/7 symmetric compact integer wavelet 1 is a 5/3 symmetric compact integer wavelet others are reserved stored as delta from last, last is reset to 0 if always_reset||keyframeqlog quality(logarithmic quantizer scale) stored as delta from last, last is reset to 0 if always_reset||keyframemv_scale stored as delta from last, last is reset to 0 if always_reset||keyframe FIXME check that everything works fine if this changes between framesqbias dequantization bias stored as delta from last, last is reset to 0 if always_reset||keyframeblock_max_depth maximum depth of the block tree stored as delta from last, last is reset to 0 if always_reset||keyframequant_table quantization tableHighlevel bitstream structure:==============================--------------------------------------------|Header|--------------------------------------------|------------------------------------|||Block0||||split?||||yes no||||......... intra?||||:Block01 :yes no||||:Block02 :....... 
..........||||:Block03 ::y DC ::ref index:||||:Block04 ::cb DC ::motion x :||||......... :cr DC ::motion y :||||....... ..........|||------------------------------------||------------------------------------|||Block1|||...|--------------------------------------------|------------ ------------ ------------|||Y subbands||Cb subbands||Cr subbands||||--- ---||--- ---||--- ---|||||LL0||HL0||||LL0||HL0||||LL0||HL0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||LH0||HH0||||LH0||HH0||||LH0||HH0|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HL1||LH1||||HL1||LH1||||HL1||LH1|||||--- ---||--- ---||--- ---||||--- ---||--- ---||--- ---|||||HH1||HL2||||HH1||HL2||||HH1||HL2|||||...||...||...|||------------ ------------ ------------|--------------------------------------------Decoding process:=================------------|||Subbands|------------||||------------|Intra DC||||LL0 subband prediction ------------|\ Dequantization ------------------- \||Reference frames|\ IDWT|------- -------|Motion \|||Frame 0||Frame 1||Compensation . OBMC v -------|------- -------|--------------. \------> Frame n output Frame Frame<----------------------------------/|...|------------------- Range Coder:============Binary Range Coder:------------------- The implemented range coder is an adapted version based upon "Range encoding: an algorithm for removing redundancy from a digitised message." by G. N. N. Martin. The symbols encoded by the Snow range coder are bits(0|1). The associated probabilities are not fix but change depending on the symbol mix seen so far. 
bit seen|new state ---------+----------------------------------------------- 0|256 - state_transition_table[256 - old_state];1|state_transition_table[old_state];state_transition_table={ 0, 0, 0, 0, 0, 0, 0, 0, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 190, 191, 192, 194, 194, 195, 196, 197, 198, 199, 200, 201, 202, 202, 204, 205, 206, 207, 208, 209, 209, 210, 211, 212, 213, 215, 215, 216, 217, 218, 219, 220, 220, 222, 223, 224, 225, 226, 227, 227, 229, 229, 230, 231, 232, 234, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 248, 0, 0, 0, 0, 0, 0, 0};FIXME Range Coding of integers:------------------------- FIXME Neighboring Blocks:===================left and top are set to the respective blocks unless they are outside of the image in which case they are set to the Null block top-left is set to the top left block unless it is outside of the image in which case it is set to the left block if this block has no larger parent block or it is at the left side of its parent block and the top right block is not outside of the image then the top right block is used for top-right else the top-left block is used Null block y, cb, cr are 128 level, ref, mx and my are 0 Motion Vector 
Prediction:=========================1. the motion vectors of all the neighboring blocks are scaled to compensate for the difference of reference frames scaled_mv=(mv *(256 *(current_reference+1)/(mv.reference+1))+128)> the median of the scaled left
Definition: snow.txt:386
avio_read
int avio_read(AVIOContext *s, unsigned char *buf, int size)
Read size bytes from AVIOContext into buf.
Definition: aviobuf.c:641
CodecMime::str
char str[32]
Definition: internal.h:57
MAX_TRUNC_PICTURE_SIZE
#define MAX_TRUNC_PICTURE_SIZE
Definition: flac_picture.c:30
CodecMime::id
enum AVCodecID id
Definition: internal.h:58
desc
const char * desc
Definition: libsvtav1.c:79
AVBufferRef
A reference to a data buffer.
Definition: buffer.h:82
bytestream2_get_bufferu
static av_always_inline unsigned int bytestream2_get_bufferu(GetByteContext *g, uint8_t *dst, unsigned int size)
Definition: bytestream.h:277
AVCodecParameters::codec_id
enum AVCodecID codec_id
Specific type of the encoded data (the codec used).
Definition: codec_par.h:60
png.h
av_dict_set
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:70
bytestream.h
bytestream2_init
static av_always_inline void bytestream2_init(GetByteContext *g, const uint8_t *buf, int buf_size)
Definition: bytestream.h:137
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:61
AV_RB64
uint64_t_TMPL AV_WL64 unsigned int_TMPL AV_WL32 unsigned int_TMPL AV_WL24 unsigned int_TMPL AV_WL16 uint64_t_TMPL AV_RB64
Definition: bytestream.h:95
ff_add_attached_pic
int ff_add_attached_pic(AVFormatContext *s, AVStream *st, AVIOContext *pb, AVBufferRef **buf, int size)
Add an attached pic to an AVStream.
Definition: utils.c:250