annotate ffmpeg/libavformat/oggparsevorbis.c @ 13:844d341cf643 tip

Back up before ISMIR
author Yading Song <yading.song@eecs.qmul.ac.uk>
date Thu, 31 Oct 2013 13:17:06 +0000
parents f445c3017523
children
rev   line source
yading@11 1 /**
yading@11 2 Copyright (C) 2005 Michael Ahlberg, Måns Rullgård
yading@11 3
yading@11 4 Permission is hereby granted, free of charge, to any person
yading@11 5 obtaining a copy of this software and associated documentation
yading@11 6 files (the "Software"), to deal in the Software without
yading@11 7 restriction, including without limitation the rights to use, copy,
yading@11 8 modify, merge, publish, distribute, sublicense, and/or sell copies
yading@11 9 of the Software, and to permit persons to whom the Software is
yading@11 10 furnished to do so, subject to the following conditions:
yading@11 11
yading@11 12 The above copyright notice and this permission notice shall be
yading@11 13 included in all copies or substantial portions of the Software.
yading@11 14
yading@11 15 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
yading@11 16 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
yading@11 17 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
yading@11 18 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
yading@11 19 HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
yading@11 20 WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
yading@11 21 OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
yading@11 22 DEALINGS IN THE SOFTWARE.
yading@11 23 **/
yading@11 24
yading@11 25 #include <stdlib.h>
yading@11 26 #include "libavutil/avstring.h"
yading@11 27 #include "libavutil/bswap.h"
yading@11 28 #include "libavutil/dict.h"
yading@11 29 #include "libavcodec/get_bits.h"
yading@11 30 #include "libavcodec/bytestream.h"
yading@11 31 #include "libavcodec/vorbis_parser.h"
yading@11 32 #include "avformat.h"
yading@11 33 #include "internal.h"
yading@11 34 #include "oggdec.h"
yading@11 35 #include "vorbiscomment.h"
yading@11 36
yading@11 37 static int ogm_chapter(AVFormatContext *as, uint8_t *key, uint8_t *val)
yading@11 38 {
yading@11 39 int i, cnum, h, m, s, ms, keylen = strlen(key);
yading@11 40 AVChapter *chapter = NULL;
yading@11 41
yading@11 42 if (keylen < 9 || sscanf(key, "CHAPTER%02d", &cnum) != 1)
yading@11 43 return 0;
yading@11 44
yading@11 45 if (keylen == 9) {
yading@11 46 if (sscanf(val, "%02d:%02d:%02d.%03d", &h, &m, &s, &ms) < 4)
yading@11 47 return 0;
yading@11 48
yading@11 49 avpriv_new_chapter(as, cnum, (AVRational){1,1000},
yading@11 50 ms + 1000*(s + 60*(m + 60*h)),
yading@11 51 AV_NOPTS_VALUE, NULL);
yading@11 52 av_free(val);
yading@11 53 } else if (!strcmp(key+9, "NAME")) {
yading@11 54 for(i = 0; i < as->nb_chapters; i++)
yading@11 55 if (as->chapters[i]->id == cnum) {
yading@11 56 chapter = as->chapters[i];
yading@11 57 break;
yading@11 58 }
yading@11 59 if (!chapter)
yading@11 60 return 0;
yading@11 61
yading@11 62 av_dict_set(&chapter->metadata, "title", val,
yading@11 63 AV_DICT_DONT_STRDUP_VAL);
yading@11 64 } else
yading@11 65 return 0;
yading@11 66
yading@11 67 av_free(key);
yading@11 68 return 1;
yading@11 69 }
yading@11 70
yading@11 71 int
yading@11 72 ff_vorbis_comment(AVFormatContext * as, AVDictionary **m, const uint8_t *buf, int size)
yading@11 73 {
yading@11 74 const uint8_t *p = buf;
yading@11 75 const uint8_t *end = buf + size;
yading@11 76 unsigned n, j;
yading@11 77 int s;
yading@11 78
yading@11 79 if (size < 8) /* must have vendor_length and user_comment_list_length */
yading@11 80 return -1;
yading@11 81
yading@11 82 s = bytestream_get_le32(&p);
yading@11 83
yading@11 84 if (end - p - 4 < s || s < 0)
yading@11 85 return -1;
yading@11 86
yading@11 87 p += s;
yading@11 88
yading@11 89 n = bytestream_get_le32(&p);
yading@11 90
yading@11 91 while (end - p >= 4 && n > 0) {
yading@11 92 const char *t, *v;
yading@11 93 int tl, vl;
yading@11 94
yading@11 95 s = bytestream_get_le32(&p);
yading@11 96
yading@11 97 if (end - p < s || s < 0)
yading@11 98 break;
yading@11 99
yading@11 100 t = p;
yading@11 101 p += s;
yading@11 102 n--;
yading@11 103
yading@11 104 v = memchr(t, '=', s);
yading@11 105 if (!v)
yading@11 106 continue;
yading@11 107
yading@11 108 tl = v - t;
yading@11 109 vl = s - tl - 1;
yading@11 110 v++;
yading@11 111
yading@11 112 if (tl && vl) {
yading@11 113 char *tt, *ct;
yading@11 114
yading@11 115 tt = av_malloc(tl + 1);
yading@11 116 ct = av_malloc(vl + 1);
yading@11 117 if (!tt || !ct) {
yading@11 118 av_freep(&tt);
yading@11 119 av_freep(&ct);
yading@11 120 av_log(as, AV_LOG_WARNING, "out-of-memory error. skipping VorbisComment tag.\n");
yading@11 121 continue;
yading@11 122 }
yading@11 123
yading@11 124 for (j = 0; j < tl; j++)
yading@11 125 tt[j] = av_toupper(t[j]);
yading@11 126 tt[tl] = 0;
yading@11 127
yading@11 128 memcpy(ct, v, vl);
yading@11 129 ct[vl] = 0;
yading@11 130
yading@11 131 if (!ogm_chapter(as, tt, ct))
yading@11 132 av_dict_set(m, tt, ct,
yading@11 133 AV_DICT_DONT_STRDUP_KEY |
yading@11 134 AV_DICT_DONT_STRDUP_VAL);
yading@11 135 }
yading@11 136 }
yading@11 137
yading@11 138 if (p != end)
yading@11 139 av_log(as, AV_LOG_INFO, "%ti bytes of comment header remain\n", end-p);
yading@11 140 if (n > 0)
yading@11 141 av_log(as, AV_LOG_INFO,
yading@11 142 "truncated comment header, %i comments not found\n", n);
yading@11 143
yading@11 144 ff_metadata_conv(m, NULL, ff_vorbiscomment_metadata_conv);
yading@11 145
yading@11 146 return 0;
yading@11 147 }
yading@11 148
yading@11 149
/**
 * Parse the vorbis header
 * Vorbis Identification header from Vorbis_I_spec.html#vorbis-spec-codec
 * [vorbis_version]    = read 32 bits as unsigned integer | Checked (must be 0)
 * [audio_channels]    = read 8 bit integer as unsigned   | Used
 * [audio_sample_rate] = read 32 bits as unsigned integer | Used
 * [bitrate_maximum]   = read 32 bits as signed integer   | Not used yet
 * [bitrate_nominal]   = read 32 bits as signed integer   | Used as bitrate
 * [bitrate_minimum]   = read 32 bits as signed integer   | Not used yet
 * [blocksize_0]       = read 4 bits as unsigned integer  | Range-checked only
 * [blocksize_1]       = read 4 bits as unsigned integer  | Range-checked only
 * [framing_flag]      = read one bit                     | Checked (must be set)
 */
yading@11 162
yading@11 163 struct oggvorbis_private {
yading@11 164 unsigned int len[3];
yading@11 165 unsigned char *packet[3];
yading@11 166 VorbisParseContext vp;
yading@11 167 int64_t final_pts;
yading@11 168 int final_duration;
yading@11 169 };
yading@11 170
yading@11 171
yading@11 172 static unsigned int
yading@11 173 fixup_vorbis_headers(AVFormatContext * as, struct oggvorbis_private *priv,
yading@11 174 uint8_t **buf)
yading@11 175 {
yading@11 176 int i,offset, len, buf_len;
yading@11 177 unsigned char *ptr;
yading@11 178
yading@11 179 len = priv->len[0] + priv->len[1] + priv->len[2];
yading@11 180 buf_len = len + len/255 + 64;
yading@11 181 ptr = *buf = av_realloc(NULL, buf_len);
yading@11 182 if (!*buf)
yading@11 183 return 0;
yading@11 184 memset(*buf, '\0', buf_len);
yading@11 185
yading@11 186 ptr[0] = 2;
yading@11 187 offset = 1;
yading@11 188 offset += av_xiphlacing(&ptr[offset], priv->len[0]);
yading@11 189 offset += av_xiphlacing(&ptr[offset], priv->len[1]);
yading@11 190 for (i = 0; i < 3; i++) {
yading@11 191 memcpy(&ptr[offset], priv->packet[i], priv->len[i]);
yading@11 192 offset += priv->len[i];
yading@11 193 av_freep(&priv->packet[i]);
yading@11 194 }
yading@11 195 *buf = av_realloc(*buf, offset + FF_INPUT_BUFFER_PADDING_SIZE);
yading@11 196 return offset;
yading@11 197 }
yading@11 198
yading@11 199 static void vorbis_cleanup(AVFormatContext *s, int idx)
yading@11 200 {
yading@11 201 struct ogg *ogg = s->priv_data;
yading@11 202 struct ogg_stream *os = ogg->streams + idx;
yading@11 203 struct oggvorbis_private *priv = os->private;
yading@11 204 int i;
yading@11 205 if (os->private)
yading@11 206 for (i = 0; i < 3; i++)
yading@11 207 av_freep(&priv->packet[i]);
yading@11 208 }
yading@11 209
yading@11 210 static int
yading@11 211 vorbis_header (AVFormatContext * s, int idx)
yading@11 212 {
yading@11 213 struct ogg *ogg = s->priv_data;
yading@11 214 struct ogg_stream *os = ogg->streams + idx;
yading@11 215 AVStream *st = s->streams[idx];
yading@11 216 struct oggvorbis_private *priv;
yading@11 217 int pkt_type = os->buf[os->pstart];
yading@11 218
yading@11 219 if (!(pkt_type & 1))
yading@11 220 return os->private ? 0 : -1;
yading@11 221
yading@11 222 if (!os->private) {
yading@11 223 os->private = av_mallocz(sizeof(struct oggvorbis_private));
yading@11 224 if (!os->private)
yading@11 225 return -1;
yading@11 226 }
yading@11 227
yading@11 228 if (os->psize < 1 || pkt_type > 5)
yading@11 229 return -1;
yading@11 230
yading@11 231 priv = os->private;
yading@11 232
yading@11 233 if (priv->packet[pkt_type>>1])
yading@11 234 return -1;
yading@11 235 if (pkt_type > 1 && !priv->packet[0] || pkt_type > 3 && !priv->packet[1])
yading@11 236 return -1;
yading@11 237
yading@11 238 priv->len[pkt_type >> 1] = os->psize;
yading@11 239 priv->packet[pkt_type >> 1] = av_mallocz(os->psize);
yading@11 240 if (!priv->packet[pkt_type >> 1])
yading@11 241 return AVERROR(ENOMEM);
yading@11 242 memcpy(priv->packet[pkt_type >> 1], os->buf + os->pstart, os->psize);
yading@11 243 if (os->buf[os->pstart] == 1) {
yading@11 244 const uint8_t *p = os->buf + os->pstart + 7; /* skip "\001vorbis" tag */
yading@11 245 unsigned blocksize, bs0, bs1;
yading@11 246 int srate;
yading@11 247 int channels;
yading@11 248
yading@11 249 if (os->psize != 30)
yading@11 250 return -1;
yading@11 251
yading@11 252 if (bytestream_get_le32(&p) != 0) /* vorbis_version */
yading@11 253 return -1;
yading@11 254
yading@11 255 channels= bytestream_get_byte(&p);
yading@11 256 if (st->codec->channels && channels != st->codec->channels) {
yading@11 257 av_log(s, AV_LOG_ERROR, "Channel change is not supported\n");
yading@11 258 return AVERROR_PATCHWELCOME;
yading@11 259 }
yading@11 260 st->codec->channels = channels;
yading@11 261 srate = bytestream_get_le32(&p);
yading@11 262 p += 4; // skip maximum bitrate
yading@11 263 st->codec->bit_rate = bytestream_get_le32(&p); // nominal bitrate
yading@11 264 p += 4; // skip minimum bitrate
yading@11 265
yading@11 266 blocksize = bytestream_get_byte(&p);
yading@11 267 bs0 = blocksize & 15;
yading@11 268 bs1 = blocksize >> 4;
yading@11 269
yading@11 270 if (bs0 > bs1)
yading@11 271 return -1;
yading@11 272 if (bs0 < 6 || bs1 > 13)
yading@11 273 return -1;
yading@11 274
yading@11 275 if (bytestream_get_byte(&p) != 1) /* framing_flag */
yading@11 276 return -1;
yading@11 277
yading@11 278 st->codec->codec_type = AVMEDIA_TYPE_AUDIO;
yading@11 279 st->codec->codec_id = AV_CODEC_ID_VORBIS;
yading@11 280
yading@11 281 if (srate > 0) {
yading@11 282 st->codec->sample_rate = srate;
yading@11 283 avpriv_set_pts_info(st, 64, 1, srate);
yading@11 284 }
yading@11 285 } else if (os->buf[os->pstart] == 3) {
yading@11 286 if (os->psize > 8 &&
yading@11 287 ff_vorbis_comment(s, &st->metadata, os->buf + os->pstart + 7, os->psize - 8) >= 0) {
yading@11 288 // drop all metadata we parsed and which is not required by libvorbis
yading@11 289 unsigned new_len = 7 + 4 + AV_RL32(priv->packet[1] + 7) + 4 + 1;
yading@11 290 if (new_len >= 16 && new_len < os->psize) {
yading@11 291 AV_WL32(priv->packet[1] + new_len - 5, 0);
yading@11 292 priv->packet[1][new_len - 1] = 1;
yading@11 293 priv->len[1] = new_len;
yading@11 294 }
yading@11 295 }
yading@11 296 } else {
yading@11 297 int ret;
yading@11 298 st->codec->extradata_size =
yading@11 299 fixup_vorbis_headers(s, priv, &st->codec->extradata);
yading@11 300 if ((ret = avpriv_vorbis_parse_extradata(st->codec, &priv->vp))) {
yading@11 301 av_freep(&st->codec->extradata);
yading@11 302 st->codec->extradata_size = 0;
yading@11 303 return ret;
yading@11 304 }
yading@11 305 }
yading@11 306
yading@11 307 return 1;
yading@11 308 }
yading@11 309
yading@11 310 static int vorbis_packet(AVFormatContext *s, int idx)
yading@11 311 {
yading@11 312 struct ogg *ogg = s->priv_data;
yading@11 313 struct ogg_stream *os = ogg->streams + idx;
yading@11 314 struct oggvorbis_private *priv = os->private;
yading@11 315 int duration;
yading@11 316
yading@11 317 /* first packet handling
yading@11 318 here we parse the duration of each packet in the first page and compare
yading@11 319 the total duration to the page granule to find the encoder delay and
yading@11 320 set the first timestamp */
yading@11 321 if ((!os->lastpts || os->lastpts == AV_NOPTS_VALUE) && !(os->flags & OGG_FLAG_EOS)) {
yading@11 322 int seg, d;
yading@11 323 uint8_t *last_pkt = os->buf + os->pstart;
yading@11 324 uint8_t *next_pkt = last_pkt;
yading@11 325
yading@11 326 avpriv_vorbis_parse_reset(&priv->vp);
yading@11 327 duration = 0;
yading@11 328 seg = os->segp;
yading@11 329 d = avpriv_vorbis_parse_frame(&priv->vp, last_pkt, 1);
yading@11 330 if (d < 0) {
yading@11 331 os->pflags |= AV_PKT_FLAG_CORRUPT;
yading@11 332 return 0;
yading@11 333 }
yading@11 334 duration += d;
yading@11 335 last_pkt = next_pkt = next_pkt + os->psize;
yading@11 336 for (; seg < os->nsegs; seg++) {
yading@11 337 if (os->segments[seg] < 255) {
yading@11 338 int d = avpriv_vorbis_parse_frame(&priv->vp, last_pkt, 1);
yading@11 339 if (d < 0) {
yading@11 340 duration = os->granule;
yading@11 341 break;
yading@11 342 }
yading@11 343 duration += d;
yading@11 344 last_pkt = next_pkt + os->segments[seg];
yading@11 345 }
yading@11 346 next_pkt += os->segments[seg];
yading@11 347 }
yading@11 348 os->lastpts = os->lastdts = os->granule - duration;
yading@11 349 if(s->streams[idx]->start_time == AV_NOPTS_VALUE) {
yading@11 350 s->streams[idx]->start_time = FFMAX(os->lastpts, 0);
yading@11 351 if (s->streams[idx]->duration)
yading@11 352 s->streams[idx]->duration -= s->streams[idx]->start_time;
yading@11 353 }
yading@11 354 priv->final_pts = AV_NOPTS_VALUE;
yading@11 355 avpriv_vorbis_parse_reset(&priv->vp);
yading@11 356 }
yading@11 357
yading@11 358 /* parse packet duration */
yading@11 359 if (os->psize > 0) {
yading@11 360 duration = avpriv_vorbis_parse_frame(&priv->vp, os->buf + os->pstart, 1);
yading@11 361 if (duration < 0) {
yading@11 362 os->pflags |= AV_PKT_FLAG_CORRUPT;
yading@11 363 return 0;
yading@11 364 }
yading@11 365 os->pduration = duration;
yading@11 366 }
yading@11 367
yading@11 368 /* final packet handling
yading@11 369 here we save the pts of the first packet in the final page, sum up all
yading@11 370 packet durations in the final page except for the last one, and compare
yading@11 371 to the page granule to find the duration of the final packet */
yading@11 372 if (os->flags & OGG_FLAG_EOS) {
yading@11 373 if (os->lastpts != AV_NOPTS_VALUE) {
yading@11 374 priv->final_pts = os->lastpts;
yading@11 375 priv->final_duration = 0;
yading@11 376 }
yading@11 377 if (os->segp == os->nsegs)
yading@11 378 os->pduration = os->granule - priv->final_pts - priv->final_duration;
yading@11 379 priv->final_duration += os->pduration;
yading@11 380 }
yading@11 381
yading@11 382 return 0;
yading@11 383 }
yading@11 384
yading@11 385 const struct ogg_codec ff_vorbis_codec = {
yading@11 386 .magic = "\001vorbis",
yading@11 387 .magicsize = 7,
yading@11 388 .header = vorbis_header,
yading@11 389 .packet = vorbis_packet,
yading@11 390 .cleanup= vorbis_cleanup,
yading@11 391 .nb_header = 3,
yading@11 392 };