FFmpeg
vorbis_parser.c
Go to the documentation of this file.
1 /*
2  * Copyright (c) 2012 Justin Ruggles
3  *
4  * This file is part of FFmpeg.
5  *
6  * FFmpeg is free software; you can redistribute it and/or
7  * modify it under the terms of the GNU Lesser General Public
8  * License as published by the Free Software Foundation; either
9  * version 2.1 of the License, or (at your option) any later version.
10  *
11  * FFmpeg is distributed in the hope that it will be useful,
12  * but WITHOUT ANY WARRANTY; without even the implied warranty of
13  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
14  * Lesser General Public License for more details.
15  *
16  * You should have received a copy of the GNU Lesser General Public
17  * License along with FFmpeg; if not, write to the Free Software
18  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
19  */
20 
21 /**
22  * @file
23  * Vorbis audio parser
24  *
25  * Determines the duration for each packet.
26  */
27 
28 #include "libavutil/log.h"
29 
30 #include "get_bits.h"
31 #include "parser.h"
32 #include "xiph.h"
33 #include "vorbis_parser_internal.h"
34 
35 static const AVClass vorbis_parser_class = {
36  .class_name = "Vorbis parser",
37  .item_name = av_default_item_name,
38  .version = LIBAVUTIL_VERSION_INT,
39 };
40 
42  const uint8_t *buf, int buf_size)
43 {
44  /* Id header should be 30 bytes */
45  if (buf_size < 30) {
46  av_log(s, AV_LOG_ERROR, "Id header is too short\n");
47  return AVERROR_INVALIDDATA;
48  }
49 
50  /* make sure this is the Id header */
51  if (buf[0] != 1) {
52  av_log(s, AV_LOG_ERROR, "Wrong packet type in Id header\n");
53  return AVERROR_INVALIDDATA;
54  }
55 
56  /* check for header signature */
57  if (memcmp(&buf[1], "vorbis", 6)) {
58  av_log(s, AV_LOG_ERROR, "Invalid packet signature in Id header\n");
59  return AVERROR_INVALIDDATA;
60  }
61 
62  if (!(buf[29] & 0x1)) {
63  av_log(s, AV_LOG_ERROR, "Invalid framing bit in Id header\n");
64  return AVERROR_INVALIDDATA;
65  }
66 
67  s->blocksize[0] = 1 << (buf[28] & 0xF);
68  s->blocksize[1] = 1 << (buf[28] >> 4);
69 
70  return 0;
71 }
72 
74  const uint8_t *buf, int buf_size)
75 {
76  GetBitContext gb, gb0;
77  uint8_t *rev_buf;
78  int i, ret = 0;
79  int got_framing_bit, mode_count, got_mode_header, last_mode_count = 0;
80 
81  /* avoid overread */
82  if (buf_size < 7) {
83  av_log(s, AV_LOG_ERROR, "Setup header is too short\n");
84  return AVERROR_INVALIDDATA;
85  }
86 
87  /* make sure this is the Setup header */
88  if (buf[0] != 5) {
89  av_log(s, AV_LOG_ERROR, "Wrong packet type in Setup header\n");
90  return AVERROR_INVALIDDATA;
91  }
92 
93  /* check for header signature */
94  if (memcmp(&buf[1], "vorbis", 6)) {
95  av_log(s, AV_LOG_ERROR, "Invalid packet signature in Setup header\n");
96  return AVERROR_INVALIDDATA;
97  }
98 
99  /* reverse bytes so we can easily read backwards with get_bits() */
100  if (!(rev_buf = av_malloc(buf_size))) {
101  av_log(s, AV_LOG_ERROR, "Out of memory\n");
102  return AVERROR(ENOMEM);
103  }
104  for (i = 0; i < buf_size; i++)
105  rev_buf[i] = buf[buf_size - 1 - i];
106  init_get_bits(&gb, rev_buf, buf_size * 8);
107 
108  got_framing_bit = 0;
109  while (get_bits_left(&gb) > 97) {
110  if (get_bits1(&gb)) {
111  got_framing_bit = get_bits_count(&gb);
112  break;
113  }
114  }
115  if (!got_framing_bit) {
116  av_log(s, AV_LOG_ERROR, "Invalid Setup header\n");
118  goto bad_header;
119  }
120 
121  /* Now we search backwards to find possible valid mode counts. This is not
122  * fool-proof because we could have false positive matches and read too
123  * far, but there isn't really any way to be sure without parsing through
124  * all the many variable-sized fields before the modes. This approach seems
125  * to work well in testing, and it is similar to how it is handled in
126  * liboggz. */
127  mode_count = 0;
128  got_mode_header = 0;
129  while (get_bits_left(&gb) >= 97) {
130  if (get_bits(&gb, 8) > 63 || get_bits(&gb, 16) || get_bits(&gb, 16))
131  break;
132  skip_bits(&gb, 1);
133  mode_count++;
134  if (mode_count > 64)
135  break;
136  gb0 = gb;
137  if (get_bits(&gb0, 6) + 1 == mode_count) {
138  got_mode_header = 1;
139  last_mode_count = mode_count;
140  }
141  }
142  if (!got_mode_header) {
143  av_log(s, AV_LOG_ERROR, "Invalid Setup header\n");
145  goto bad_header;
146  }
147  /* All samples I've seen use <= 2 modes, so ask for a sample if we find
148  * more than that, as it is most likely a false positive. If we get any
149  * we may need to approach this the long way and parse the whole Setup
150  * header, but I hope very much that it never comes to that. */
151  if (last_mode_count > 2) {
153  "%d modes (either a false positive or a "
154  "sample from an unknown encoder)",
155  last_mode_count);
156  }
157  /* We're limiting the mode count to 63 so that we know that the previous
158  * block flag will be in the first packet byte. */
159  if (last_mode_count > 63) {
160  av_log(s, AV_LOG_ERROR, "Unsupported mode count: %d\n",
161  last_mode_count);
163  goto bad_header;
164  }
165  s->mode_count = mode_count = last_mode_count;
166  /* Determine the number of bits required to code the mode and turn that
167  * into a bitmask to directly access the mode from the first frame byte. */
168  s->mode_mask = ((1 << (av_log2(mode_count - 1) + 1)) - 1) << 1;
169  /* The previous window flag is the next bit after the mode */
170  s->prev_mask = (s->mode_mask | 0x1) + 1;
171 
172  init_get_bits(&gb, rev_buf, buf_size * 8);
173  skip_bits_long(&gb, got_framing_bit);
174  for (i = mode_count - 1; i >= 0; i--) {
175  skip_bits_long(&gb, 40);
176  s->mode_blocksize[i] = get_bits1(&gb);
177  }
178 
179 bad_header:
180  av_free(rev_buf);
181  return ret;
182 }
183 
185  const uint8_t *extradata, int extradata_size)
186 {
187  const uint8_t *header_start[3];
188  int header_len[3];
189  int ret;
190 
191  s->class = &vorbis_parser_class;
192  s->extradata_parsed = 1;
193 
194  if ((ret = avpriv_split_xiph_headers(extradata,
195  extradata_size, 30,
196  header_start, header_len)) < 0) {
197  av_log(s, AV_LOG_ERROR, "Extradata corrupt.\n");
198  return ret;
199  }
200 
201  if ((ret = parse_id_header(s, header_start[0], header_len[0])) < 0)
202  return ret;
203 
204  if ((ret = parse_setup_header(s, header_start[2], header_len[2])) < 0)
205  return ret;
206 
207  s->valid_extradata = 1;
208  s->previous_blocksize = s->blocksize[s->mode_blocksize[0]];
209 
210  return 0;
211 }
212 
214  int buf_size, int *flags)
215 {
216  int duration = 0;
217 
218  if (s->valid_extradata && buf_size > 0) {
219  int mode, current_blocksize;
220  int previous_blocksize = s->previous_blocksize;
221 
222  if (buf[0] & 1) {
223  /* If the user doesn't care about special packets, it's a bad one. */
224  if (!flags)
225  goto bad_packet;
226 
227  /* Set the flag for which kind of special packet it is. */
228  if (buf[0] == 1)
230  else if (buf[0] == 3)
232  else if (buf[0] == 5)
234  else
235  goto bad_packet;
236 
237  /* Special packets have no duration. */
238  return 0;
239 
240 bad_packet:
241  av_log(s, AV_LOG_ERROR, "Invalid packet\n");
242  return AVERROR_INVALIDDATA;
243  }
244  if (s->mode_count == 1)
245  mode = 0;
246  else
247  mode = (buf[0] & s->mode_mask) >> 1;
248  if (mode >= s->mode_count) {
249  av_log(s, AV_LOG_ERROR, "Invalid mode in packet\n");
250  return AVERROR_INVALIDDATA;
251  }
252  if(s->mode_blocksize[mode]){
253  int flag = !!(buf[0] & s->prev_mask);
254  previous_blocksize = s->blocksize[flag];
255  }
256  current_blocksize = s->blocksize[s->mode_blocksize[mode]];
257  duration = (previous_blocksize + current_blocksize) >> 2;
258  s->previous_blocksize = current_blocksize;
259  }
260 
261  return duration;
262 }
263 
265  int buf_size)
266 {
267  return av_vorbis_parse_frame_flags(s, buf, buf_size, NULL);
268 }
269 
271 {
272  if (s->valid_extradata)
273  s->previous_blocksize = s->blocksize[0];
274 }
275 
277 {
278  av_freep(s);
279 }
280 
282  int extradata_size)
283 {
284  AVVorbisParseContext *s = av_mallocz(sizeof(*s));
285  int ret;
286 
287  if (!s)
288  return NULL;
289 
290  ret = vorbis_parse_init(s, extradata, extradata_size);
291  if (ret < 0) {
293  return NULL;
294  }
295 
296  return s;
297 }
298 
299 #if CONFIG_VORBIS_PARSER
300 
301 typedef struct VorbisParseContext {
303 } VorbisParseContext;
304 
305 static int vorbis_parse(AVCodecParserContext *s1, AVCodecContext *avctx,
306  const uint8_t **poutbuf, int *poutbuf_size,
307  const uint8_t *buf, int buf_size)
308 {
309  VorbisParseContext *s = s1->priv_data;
310  int duration;
311 
312  if (!s->vp && avctx->extradata && avctx->extradata_size) {
313  s->vp = av_vorbis_parse_init(avctx->extradata, avctx->extradata_size);
314  }
315  if (!s->vp)
316  goto end;
317 
318  if ((duration = av_vorbis_parse_frame(s->vp, buf, buf_size)) >= 0)
319  s1->duration = duration;
320 
321 end:
322  /* always return the full packet. this parser isn't doing any splitting or
323  combining, only packet analysis */
324  *poutbuf = buf;
325  *poutbuf_size = buf_size;
326  return buf_size;
327 }
328 
329 static void vorbis_parser_close(AVCodecParserContext *ctx)
330 {
331  VorbisParseContext *s = ctx->priv_data;
332  av_vorbis_parse_free(&s->vp);
333 }
334 
337  .priv_data_size = sizeof(VorbisParseContext),
338  .parser_parse = vorbis_parse,
339  .parser_close = vorbis_parser_close,
340 };
341 #endif /* CONFIG_VORBIS_PARSER */
skip_bits_long
static void skip_bits_long(GetBitContext *s, int n)
Skips the specified number of bits.
Definition: get_bits.h:291
av_vorbis_parse_free
void av_vorbis_parse_free(AVVorbisParseContext **s)
Free the parser and everything associated with it.
Definition: vorbis_parser.c:276
get_bits_left
static int get_bits_left(GetBitContext *gb)
Definition: get_bits.h:849
AVERROR
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFrame structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Frame references ownership and permissions
AVVorbisParseContext
Definition: vorbis_parser_internal.h:34
av_vorbis_parse_frame_flags
int av_vorbis_parse_frame_flags(AVVorbisParseContext *s, const uint8_t *buf, int buf_size, int *flags)
Get the duration for a Vorbis packet.
Definition: vorbis_parser.c:213
get_bits_count
static int get_bits_count(const GetBitContext *s)
Definition: get_bits.h:219
av_vorbis_parse_frame
int av_vorbis_parse_frame(AVVorbisParseContext *s, const uint8_t *buf, int buf_size)
Get the duration for a Vorbis packet.
Definition: vorbis_parser.c:264
init_get_bits
static int init_get_bits(GetBitContext *s, const uint8_t *buffer, int bit_size)
Initialize GetBitContext.
Definition: get_bits.h:659
av_malloc
#define av_malloc(s)
Definition: tableprint_vlc.h:31
xiph.h
skip_bits
static void skip_bits(GetBitContext *s, int n)
Definition: get_bits.h:467
get_bits
static unsigned int get_bits(GetBitContext *s, int n)
Read 1-25 bits.
Definition: get_bits.h:379
GetBitContext
Definition: get_bits.h:61
AV_LOG_ERROR
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:194
duration
int64_t duration
Definition: movenc.c:64
AVCodecContext::extradata_size
int extradata_size
Definition: avcodec.h:638
s
#define s(width, name)
Definition: cbs_vp9.c:257
s1
#define s1
Definition: regdef.h:38
VORBIS_FLAG_COMMENT
#define VORBIS_FLAG_COMMENT
Definition: vorbis_parser.h:45
ctx
AVFormatContext * ctx
Definition: movenc.c:48
get_bits.h
LIBAVUTIL_VERSION_INT
#define LIBAVUTIL_VERSION_INT
Definition: version.h:85
AVClass
Describe the class of an AVClass context structure.
Definition: log.h:67
NULL
#define NULL
Definition: coverity.c:32
parse_id_header
static int parse_id_header(AVVorbisParseContext *s, const uint8_t *buf, int buf_size)
Definition: vorbis_parser.c:41
VORBIS_FLAG_HEADER
#define VORBIS_FLAG_HEADER
Definition: vorbis_parser.h:44
AVCodecParser::codec_ids
int codec_ids[5]
Definition: avcodec.h:3545
av_default_item_name
const char * av_default_item_name(void *ptr)
Return the context name.
Definition: log.c:235
get_bits1
static unsigned int get_bits1(GetBitContext *s)
Definition: get_bits.h:498
ff_vorbis_parser
AVCodecParser ff_vorbis_parser
vorbis_parser_internal.h
vorbis_parser_class
static const AVClass vorbis_parser_class
Definition: vorbis_parser.c:35
flag
#define flag(name)
Definition: cbs_av1.c:553
i
int i
Definition: input.c:407
log.h
AVCodecContext::extradata
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
Definition: avcodec.h:637
uint8_t
uint8_t
Definition: audio_convert.c:194
av_mallocz
void * av_mallocz(size_t size)
Allocate a memory block with alignment suitable for all memory accesses (including vectors if availab...
Definition: mem.c:237
parser.h
vorbis_parse_init
static int vorbis_parse_init(AVVorbisParseContext *s, const uint8_t *extradata, int extradata_size)
Definition: vorbis_parser.c:184
AVCodecParserContext
Definition: avcodec.h:3377
ret
ret
Definition: filter_design.txt:187
AVClass::class_name
const char * class_name
The name of the class; usually it is the same name as the context structure type to which the AVClass...
Definition: log.h:72
av_vorbis_parse_init
AVVorbisParseContext * av_vorbis_parse_init(const uint8_t *extradata, int extradata_size)
Allocate and initialize the Vorbis parser using headers in the extradata.
Definition: vorbis_parser.c:281
AVCodecContext
main external API structure.
Definition: avcodec.h:536
VORBIS_FLAG_SETUP
#define VORBIS_FLAG_SETUP
Definition: vorbis_parser.h:46
mode
mode
Definition: ebur128.h:83
avpriv_split_xiph_headers
int avpriv_split_xiph_headers(const uint8_t *extradata, int extradata_size, int first_header_size, const uint8_t *header_start[3], int header_len[3])
Split a single extradata buffer into the three headers that most Xiph codecs use.
Definition: xiph.c:24
av_vorbis_parse_reset
void av_vorbis_parse_reset(AVVorbisParseContext *s)
Definition: vorbis_parser.c:270
avpriv_request_sample
#define avpriv_request_sample(...)
Definition: tableprint_vlc.h:39
av_free
#define av_free(p)
Definition: tableprint_vlc.h:34
av_freep
#define av_freep(p)
Definition: tableprint_vlc.h:35
AVCodecParser
Definition: avcodec.h:3544
flags
#define flags(name, subs,...)
Definition: cbs_av1.c:561
av_log
#define av_log(a,...)
Definition: tableprint_vlc.h:28
AVERROR_INVALIDDATA
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
AV_CODEC_ID_VORBIS
@ AV_CODEC_ID_VORBIS
Definition: codec_id.h:429
parse_setup_header
static int parse_setup_header(AVVorbisParseContext *s, const uint8_t *buf, int buf_size)
Definition: vorbis_parser.c:73
AVFormatContext::priv_data
void * priv_data
Format private data.
Definition: avformat.h:1260
av_log2
int av_log2(unsigned v)
Definition: intmath.c:26