oggparsevorbis.c
Go to the documentation of this file.
1 /**
2  Copyright (C) 2005 Michael Ahlberg, Måns Rullgård
3 
4  Permission is hereby granted, free of charge, to any person
5  obtaining a copy of this software and associated documentation
6  files (the "Software"), to deal in the Software without
7  restriction, including without limitation the rights to use, copy,
8  modify, merge, publish, distribute, sublicense, and/or sell copies
9  of the Software, and to permit persons to whom the Software is
10  furnished to do so, subject to the following conditions:
11 
12  The above copyright notice and this permission notice shall be
13  included in all copies or substantial portions of the Software.
14 
15  THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
16  EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
17  MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
18  NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
19  HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
20  WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
21  OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
22  DEALINGS IN THE SOFTWARE.
23 **/
24 
25 #include <stdlib.h>
26 #include "libavutil/avstring.h"
27 #include "libavutil/bswap.h"
28 #include "libavutil/dict.h"
29 #include "libavcodec/get_bits.h"
30 #include "libavcodec/bytestream.h"
32 #include "avformat.h"
33 #include "internal.h"
34 #include "oggdec.h"
35 #include "vorbiscomment.h"
36 
38 {
39  int i, cnum, h, m, s, ms, keylen = strlen(key);
40  AVChapter *chapter = NULL;
41 
42  if (keylen < 9 || sscanf(key, "CHAPTER%02d", &cnum) != 1)
43  return 0;
44 
45  if (keylen == 9) {
46  if (sscanf(val, "%02d:%02d:%02d.%03d", &h, &m, &s, &ms) < 4)
47  return 0;
48 
49  avpriv_new_chapter(as, cnum, (AVRational){1,1000},
50  ms + 1000*(s + 60*(m + 60*h)),
52  av_free(val);
53  } else if (!strcmp(key+9, "NAME")) {
54  for(i = 0; i < as->nb_chapters; i++)
55  if (as->chapters[i]->id == cnum) {
56  chapter = as->chapters[i];
57  break;
58  }
59  if (!chapter)
60  return 0;
61 
62  av_dict_set(&chapter->metadata, "title", val,
64  } else
65  return 0;
66 
67  av_free(key);
68  return 1;
69 }
70 
71 int
73 {
74  const uint8_t *p = buf;
75  const uint8_t *end = buf + size;
76  unsigned n, j;
77  int s;
78 
79  if (size < 8) /* must have vendor_length and user_comment_list_length */
80  return -1;
81 
82  s = bytestream_get_le32(&p);
83 
84  if (end - p - 4 < s || s < 0)
85  return -1;
86 
87  p += s;
88 
89  n = bytestream_get_le32(&p);
90 
91  while (end - p >= 4 && n > 0) {
92  const char *t, *v;
93  int tl, vl;
94 
95  s = bytestream_get_le32(&p);
96 
97  if (end - p < s || s < 0)
98  break;
99 
100  t = p;
101  p += s;
102  n--;
103 
104  v = memchr(t, '=', s);
105  if (!v)
106  continue;
107 
108  tl = v - t;
109  vl = s - tl - 1;
110  v++;
111 
112  if (tl && vl) {
113  char *tt, *ct;
114 
115  tt = av_malloc(tl + 1);
116  ct = av_malloc(vl + 1);
117  if (!tt || !ct) {
118  av_freep(&tt);
119  av_freep(&ct);
120  av_log(as, AV_LOG_WARNING, "out-of-memory error. skipping VorbisComment tag.\n");
121  continue;
122  }
123 
124  for (j = 0; j < tl; j++)
125  tt[j] = av_toupper(t[j]);
126  tt[tl] = 0;
127 
128  memcpy(ct, v, vl);
129  ct[vl] = 0;
130 
131  if (!ogm_chapter(as, tt, ct))
132  av_dict_set(m, tt, ct,
135  }
136  }
137 
138  if (p != end)
139  av_log(as, AV_LOG_INFO, "%ti bytes of comment header remain\n", end-p);
140  if (n > 0)
141  av_log(as, AV_LOG_INFO,
142  "truncated comment header, %i comments not found\n", n);
143 
145 
146  return 0;
147 }
148 
149 
150 /** Parse the vorbis header
151  * Vorbis Identification header from Vorbis_I_spec.html#vorbis-spec-codec
152  * [vorbis_version] = read 32 bits as unsigned integer | Not used
153  * [audio_channels] = read 8 bit integer as unsigned | Used
154  * [audio_sample_rate] = read 32 bits as unsigned integer | Used
155  * [bitrate_maximum] = read 32 bits as signed integer | Not used yet
156  * [bitrate_nominal] = read 32 bits as signed integer | Not used yet
157  * [bitrate_minimum] = read 32 bits as signed integer | Used as bitrate
158  * [blocksize_0] = read 4 bits as unsigned integer | Not Used
159  * [blocksize_1] = read 4 bits as unsigned integer | Not Used
160  * [framing_flag] = read one bit | Not Used
161  * */
162 
164  unsigned int len[3];
165  unsigned char *packet[3];
167  int64_t final_pts;
169 };
170 
171 
172 static unsigned int
174  uint8_t **buf)
175 {
176  int i,offset, len, buf_len;
177  unsigned char *ptr;
178 
179  len = priv->len[0] + priv->len[1] + priv->len[2];
180  buf_len = len + len/255 + 64;
181  ptr = *buf = av_realloc(NULL, buf_len);
182  if (!*buf)
183  return 0;
184  memset(*buf, '\0', buf_len);
185 
186  ptr[0] = 2;
187  offset = 1;
188  offset += av_xiphlacing(&ptr[offset], priv->len[0]);
189  offset += av_xiphlacing(&ptr[offset], priv->len[1]);
190  for (i = 0; i < 3; i++) {
191  memcpy(&ptr[offset], priv->packet[i], priv->len[i]);
192  offset += priv->len[i];
193  av_freep(&priv->packet[i]);
194  }
195  *buf = av_realloc(*buf, offset + FF_INPUT_BUFFER_PADDING_SIZE);
196  return offset;
197 }
198 
199 static void vorbis_cleanup(AVFormatContext *s, int idx)
200 {
201  struct ogg *ogg = s->priv_data;
202  struct ogg_stream *os = ogg->streams + idx;
203  struct oggvorbis_private *priv = os->private;
204  int i;
205  if (os->private)
206  for (i = 0; i < 3; i++)
207  av_freep(&priv->packet[i]);
208 }
209 
210 static int
212 {
213  struct ogg *ogg = s->priv_data;
214  struct ogg_stream *os = ogg->streams + idx;
215  AVStream *st = s->streams[idx];
216  struct oggvorbis_private *priv;
217  int pkt_type = os->buf[os->pstart];
218 
219  if (!(pkt_type & 1))
220  return os->private ? 0 : -1;
221 
222  if (!os->private) {
223  os->private = av_mallocz(sizeof(struct oggvorbis_private));
224  if (!os->private)
225  return -1;
226  }
227 
228  if (os->psize < 1 || pkt_type > 5)
229  return -1;
230 
231  priv = os->private;
232 
233  if (priv->packet[pkt_type>>1])
234  return -1;
235  if (pkt_type > 1 && !priv->packet[0] || pkt_type > 3 && !priv->packet[1])
236  return -1;
237 
238  priv->len[pkt_type >> 1] = os->psize;
239  priv->packet[pkt_type >> 1] = av_mallocz(os->psize);
240  if (!priv->packet[pkt_type >> 1])
241  return AVERROR(ENOMEM);
242  memcpy(priv->packet[pkt_type >> 1], os->buf + os->pstart, os->psize);
243  if (os->buf[os->pstart] == 1) {
244  const uint8_t *p = os->buf + os->pstart + 7; /* skip "\001vorbis" tag */
245  unsigned blocksize, bs0, bs1;
246  int srate;
247  int channels;
248 
249  if (os->psize != 30)
250  return -1;
251 
252  if (bytestream_get_le32(&p) != 0) /* vorbis_version */
253  return -1;
254 
255  channels= bytestream_get_byte(&p);
256  if (st->codec->channels && channels != st->codec->channels) {
257  av_log(s, AV_LOG_ERROR, "Channel change is not supported\n");
258  return AVERROR_PATCHWELCOME;
259  }
260  st->codec->channels = channels;
261  srate = bytestream_get_le32(&p);
262  p += 4; // skip maximum bitrate
263  st->codec->bit_rate = bytestream_get_le32(&p); // nominal bitrate
264  p += 4; // skip minimum bitrate
265 
266  blocksize = bytestream_get_byte(&p);
267  bs0 = blocksize & 15;
268  bs1 = blocksize >> 4;
269 
270  if (bs0 > bs1)
271  return -1;
272  if (bs0 < 6 || bs1 > 13)
273  return -1;
274 
275  if (bytestream_get_byte(&p) != 1) /* framing_flag */
276  return -1;
277 
280 
281  if (srate > 0) {
282  st->codec->sample_rate = srate;
283  avpriv_set_pts_info(st, 64, 1, srate);
284  }
285  } else if (os->buf[os->pstart] == 3) {
286  if (os->psize > 8 &&
287  ff_vorbis_comment(s, &st->metadata, os->buf + os->pstart + 7, os->psize - 8) >= 0) {
288  // drop all metadata we parsed and which is not required by libvorbis
289  unsigned new_len = 7 + 4 + AV_RL32(priv->packet[1] + 7) + 4 + 1;
290  if (new_len >= 16 && new_len < os->psize) {
291  AV_WL32(priv->packet[1] + new_len - 5, 0);
292  priv->packet[1][new_len - 1] = 1;
293  priv->len[1] = new_len;
294  }
295  }
296  } else {
297  int ret;
298  st->codec->extradata_size =
299  fixup_vorbis_headers(s, priv, &st->codec->extradata);
300  if ((ret = avpriv_vorbis_parse_extradata(st->codec, &priv->vp))) {
301  av_freep(&st->codec->extradata);
302  st->codec->extradata_size = 0;
303  return ret;
304  }
305  }
306 
307  return 1;
308 }
309 
310 static int vorbis_packet(AVFormatContext *s, int idx)
311 {
312  struct ogg *ogg = s->priv_data;
313  struct ogg_stream *os = ogg->streams + idx;
314  struct oggvorbis_private *priv = os->private;
315  int duration;
316 
317  /* first packet handling
318  here we parse the duration of each packet in the first page and compare
319  the total duration to the page granule to find the encoder delay and
320  set the first timestamp */
321  if ((!os->lastpts || os->lastpts == AV_NOPTS_VALUE) && !(os->flags & OGG_FLAG_EOS)) {
322  int seg, d;
323  uint8_t *last_pkt = os->buf + os->pstart;
324  uint8_t *next_pkt = last_pkt;
325 
327  duration = 0;
328  seg = os->segp;
329  d = avpriv_vorbis_parse_frame(&priv->vp, last_pkt, 1);
330  if (d < 0) {
332  return 0;
333  }
334  duration += d;
335  last_pkt = next_pkt = next_pkt + os->psize;
336  for (; seg < os->nsegs; seg++) {
337  if (os->segments[seg] < 255) {
338  int d = avpriv_vorbis_parse_frame(&priv->vp, last_pkt, 1);
339  if (d < 0) {
340  duration = os->granule;
341  break;
342  }
343  duration += d;
344  last_pkt = next_pkt + os->segments[seg];
345  }
346  next_pkt += os->segments[seg];
347  }
348  os->lastpts = os->lastdts = os->granule - duration;
349  if(s->streams[idx]->start_time == AV_NOPTS_VALUE) {
350  s->streams[idx]->start_time = FFMAX(os->lastpts, 0);
351  if (s->streams[idx]->duration)
352  s->streams[idx]->duration -= s->streams[idx]->start_time;
353  }
354  priv->final_pts = AV_NOPTS_VALUE;
356  }
357 
358  /* parse packet duration */
359  if (os->psize > 0) {
360  duration = avpriv_vorbis_parse_frame(&priv->vp, os->buf + os->pstart, 1);
361  if (duration < 0) {
363  return 0;
364  }
365  os->pduration = duration;
366  }
367 
368  /* final packet handling
369  here we save the pts of the first packet in the final page, sum up all
370  packet durations in the final page except for the last one, and compare
371  to the page granule to find the duration of the final packet */
372  if (os->flags & OGG_FLAG_EOS) {
373  if (os->lastpts != AV_NOPTS_VALUE) {
374  priv->final_pts = os->lastpts;
375  priv->final_duration = 0;
376  }
377  if (os->segp == os->nsegs)
378  os->pduration = os->granule - priv->final_pts - priv->final_duration;
379  priv->final_duration += os->pduration;
380  }
381 
382  return 0;
383 }
384 
385 const struct ogg_codec ff_vorbis_codec = {
386  .magic = "\001vorbis",
387  .magicsize = 7,
388  .header = vorbis_header,
389  .packet = vorbis_packet,
390  .cleanup= vorbis_cleanup,
391  .nb_header = 3,
392 };
unsigned int nb_chapters
Definition: avformat.h:1089
void * av_mallocz(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
Definition: mem.c:205
float v
const char * s
Definition: avisynth_c.h:668
static int vorbis_header(AVFormatContext *s, int idx)
VorbisParseContext vp
Copyright (C) 2005 Michael Ahlberg, Måns Rullgård.
Definition: oggdec.h:31
unsigned int pflags
Definition: oggdec.h:67
int avpriv_vorbis_parse_frame(VorbisParseContext *s, const uint8_t *buf, int buf_size)
Get the duration for a Vorbis packet.
int ff_vorbis_comment(AVFormatContext *as, AVDictionary **m, const uint8_t *buf, int size)
Parse the vorbis header Vorbis Identification header from Vorbis_I_spec.html::vorbis-spec-codec [vorb...
void avpriv_set_pts_info(AVStream *s, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
static unsigned int fixup_vorbis_headers(AVFormatContext *as, struct oggvorbis_private *priv, uint8_t **buf)
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:154
void avpriv_vorbis_parse_reset(VorbisParseContext *s)
void * av_realloc(void *ptr, size_t size)
Allocate or reallocate a block of memory.
Definition: mem.c:141
int flags
Definition: oggdec.h:76
AVDictionary * metadata
Definition: avformat.h:922
unsigned char * packet[3]
int64_t lastpts
Definition: oggdec.h:72
#define AV_DICT_DONT_STRDUP_KEY
Take ownership of a key that&#39;s been allocated with av_malloc() and children.
Definition: dict.h:69
void av_freep(void *arg)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc() and set the pointer ...
Definition: mem.c:198
AVChapter * avpriv_new_chapter(AVFormatContext *s, int id, AVRational time_base, int64_t start, int64_t end, const char *title)
Add a new chapter.
set threshold d
Format I/O context.
Definition: avformat.h:944
unsigned int psize
Definition: oggdec.h:66
#define AV_WL32(p, darg)
Definition: intreadwrite.h:282
Public dictionary API.
uint8_t
window constants for m
int id
unique ID to identify the chapter
Definition: avformat.h:919
end end
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
AVStream ** streams
Definition: avformat.h:992
Vorbis audio parser.
bitstream reader API header.
static int64_t duration
Definition: ffplay.c:294
static void vorbis_cleanup(AVFormatContext *s, int idx)
const AVMetadataConv ff_vorbiscomment_metadata_conv[]
VorbisComment metadata conversion mapping.
Definition: vorbiscomment.c:33
void av_free(void *ptr)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc(). ...
Definition: mem.c:183
#define OGG_FLAG_EOS
Definition: oggdec.h:109
AVChapter ** chapters
Definition: avformat.h:1090
void av_log(void *avcl, int level, const char *fmt,...)
Definition: log.c:246
static const uint8_t offset[127][2]
Definition: vf_spp.c:70
#define FFMAX(a, b)
Definition: common.h:56
uint8_t segments[255]
Definition: oggdec.h:80
int size
AVCodecContext * codec
Codec context associated with this stream.
Definition: avformat.h:662
#define FF_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding...
int bit_rate
the average bitrate
uint64_t granule
Definition: oggdec.h:70
#define AV_DICT_DONT_STRDUP_VAL
Take ownership of a value that&#39;s been allocated with av_malloc() and chilren.
Definition: dict.h:72
ret
Definition: avfilter.c:821
unsigned int pstart
Definition: oggdec.h:65
t
Definition: genspecsines3.m:6
struct ogg_stream * streams
Definition: oggdec.h:99
int segp
Definition: oggdec.h:79
static int ogm_chapter(AVFormatContext *as, uint8_t *key, uint8_t *val)
Copyright (C) 2005 Michael Ahlberg, Måns Rullgård.
#define AV_RL32
AVDictionary * metadata
Definition: avformat.h:711
Stream structure.
Definition: avformat.h:643
#define AVERROR_PATCHWELCOME
Not yet implemented in FFmpeg, patches welcome.
Definition: error.h:62
NULL
Definition: eval.c:55
enum AVMediaType codec_type
unsigned int pduration
Definition: oggdec.h:68
int nsegs
Definition: oggdec.h:79
enum AVCodecID codec_id
unsigned int len[3]
int sample_rate
samples per second
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:148
void * buf
Definition: avisynth_c.h:594
void * private
Definition: oggdec.h:87
int av_dict_set(AVDictionary **pm, const char *key, const char *value, int flags)
Set the given entry in *pm, overwriting an existing entry.
Definition: dict.c:62
unsigned int av_xiphlacing(unsigned char *s, unsigned int v)
Encode extradata length to a buffer.
void * av_malloc(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
Definition: mem.c:73
synthesis window for stochastic i
rational number numerator/denominator
Definition: rational.h:43
byte swapping routines
int64_t lastdts
Definition: oggdec.h:73
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFilterBuffer structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later.That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another.Buffer references ownership and permissions
const int8_t * magic
Definition: oggdec.h:32
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:696
static int av_toupper(int c)
Locale-independent conversion of ASCII characters to uppercase.
Definition: avstring.h:206
uint8_t * buf
Definition: oggdec.h:62
Main libavformat public API header.
int64_t start_time
Decoding: pts of the first frame of the stream in presentation order, in stream time base...
Definition: avformat.h:689
static int vorbis_packet(AVFormatContext *s, int idx)
#define AV_PKT_FLAG_CORRUPT
The packet content is corrupted.
void ff_metadata_conv(AVDictionary **pm, const AVMetadataConv *d_conv, const AVMetadataConv *s_conv)
Definition: oggdec.h:98
int channels
number of audio channels
void * priv_data
Format private data.
Definition: avformat.h:964
const struct ogg_codec ff_vorbis_codec
#define AV_LOG_INFO
Definition: log.h:156
int avpriv_vorbis_parse_extradata(AVCodecContext *avctx, VorbisParseContext *s)
Initialize the Vorbis parser using headers in the extradata.
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:190