xwma.c
Go to the documentation of this file.
1 /*
2  * xWMA demuxer
3  * Copyright (c) 2011 Max Horn
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
#include <inttypes.h>

#include "libavutil/mathematics.h"

#include "avformat.h"
#include "internal.h"
#include "riff.h"
27 
28 /*
29  * Demuxer for xWMA, a Microsoft audio container used by XAudio 2.
30  */
31 
/**
 * Private demuxer state for an xWMA file.
 */
typedef struct XWMAContext {
    /* Absolute offset in the input at which the data chunk ends; set to
     * INT64_MAX by the header parser when the chunk declares a size of 0. */
    int64_t data_end;
} XWMAContext;
35 
36 static int xwma_probe(AVProbeData *p)
37 {
38  if (!memcmp(p->buf, "RIFF", 4) && !memcmp(p->buf + 8, "XWMA", 4))
39  return AVPROBE_SCORE_MAX;
40  return 0;
41 }
42 
44 {
45  int64_t size;
46  int ret;
47  uint32_t dpds_table_size = 0;
48  uint32_t *dpds_table = 0;
49  unsigned int tag;
50  AVIOContext *pb = s->pb;
51  AVStream *st;
52  XWMAContext *xwma = s->priv_data;
53  int i;
54 
55  /* The following code is mostly copied from wav.c, with some
56  * minor alterations.
57  */
58 
59  /* check RIFF header */
60  tag = avio_rl32(pb);
61  if (tag != MKTAG('R', 'I', 'F', 'F'))
62  return -1;
63  avio_rl32(pb); /* file size */
64  tag = avio_rl32(pb);
65  if (tag != MKTAG('X', 'W', 'M', 'A'))
66  return -1;
67 
68  /* parse fmt header */
69  tag = avio_rl32(pb);
70  if (tag != MKTAG('f', 'm', 't', ' '))
71  return -1;
72  size = avio_rl32(pb);
73  st = avformat_new_stream(s, NULL);
74  if (!st)
75  return AVERROR(ENOMEM);
76 
77  ret = ff_get_wav_header(pb, st->codec, size);
78  if (ret < 0)
79  return ret;
81 
82  /* All xWMA files I have seen contained WMAv2 data. If there are files
83  * using WMA Pro or some other codec, then we need to figure out the right
84  * extradata for that. Thus, ask the user for feedback, but try to go on
85  * anyway.
86  */
87  if (st->codec->codec_id != AV_CODEC_ID_WMAV2) {
88  avpriv_request_sample(s, "Unexpected codec (tag 0x04%x; id %d)",
89  st->codec->codec_tag, st->codec->codec_id);
90  } else {
91  /* In all xWMA files I have seen, there is no extradata. But the WMA
92  * codecs require extradata, so we provide our own fake extradata.
93  *
94  * First, check that there really was no extradata in the header. If
95  * there was, then try to use it, after asking the user to provide a
96  * sample of this unusual file.
97  */
98  if (st->codec->extradata_size != 0) {
99  /* Surprise, surprise: We *did* get some extradata. No idea
100  * if it will work, but just go on and try it, after asking
101  * the user for a sample.
102  */
103  avpriv_request_sample(s, "Unexpected extradata (%d bytes)",
104  st->codec->extradata_size);
105  } else {
106  st->codec->extradata_size = 6;
108  if (!st->codec->extradata)
109  return AVERROR(ENOMEM);
110 
111  /* setup extradata with our experimentally obtained value */
112  st->codec->extradata[4] = 31;
113  }
114  }
115 
116  if (!st->codec->channels) {
117  av_log(s, AV_LOG_WARNING, "Invalid channel count: %d\n",
118  st->codec->channels);
119  return AVERROR_INVALIDDATA;
120  }
121  if (!st->codec->bits_per_coded_sample) {
122  av_log(s, AV_LOG_WARNING, "Invalid bits_per_coded_sample: %d\n",
124  return AVERROR_INVALIDDATA;
125  }
126 
127  /* set the sample rate */
128  avpriv_set_pts_info(st, 64, 1, st->codec->sample_rate);
129 
130  /* parse the remaining RIFF chunks */
131  for (;;) {
132  if (pb->eof_reached)
133  return -1;
134  /* read next chunk tag */
135  tag = avio_rl32(pb);
136  size = avio_rl32(pb);
137  if (tag == MKTAG('d', 'a', 't', 'a')) {
138  /* We assume that the data chunk comes last. */
139  break;
140  } else if (tag == MKTAG('d','p','d','s')) {
141  /* Quoting the MSDN xWMA docs on the dpds chunk: "Contains the
142  * decoded packet cumulative data size array, each element is the
143  * number of bytes accumulated after the corresponding xWMA packet
144  * is decoded in order."
145  *
146  * Each packet has size equal to st->codec->block_align, which in
147  * all cases I saw so far was always 2230. Thus, we can use the
148  * dpds data to compute a seeking index.
149  */
150 
151  /* Error out if there is more than one dpds chunk. */
152  if (dpds_table) {
153  av_log(s, AV_LOG_ERROR, "two dpds chunks present\n");
154  return -1;
155  }
156 
157  /* Compute the number of entries in the dpds chunk. */
158  if (size & 3) { /* Size should be divisible by four */
160  "dpds chunk size %"PRId64" not divisible by 4\n", size);
161  }
162  dpds_table_size = size / 4;
163  if (dpds_table_size == 0 || dpds_table_size >= INT_MAX / 4) {
164  av_log(s, AV_LOG_ERROR,
165  "dpds chunk size %"PRId64" invalid\n", size);
166  return -1;
167  }
168 
169  /* Allocate some temporary storage to keep the dpds data around.
170  * for processing later on.
171  */
172  dpds_table = av_malloc(dpds_table_size * sizeof(uint32_t));
173  if (!dpds_table) {
174  return AVERROR(ENOMEM);
175  }
176 
177  for (i = 0; i < dpds_table_size; ++i) {
178  dpds_table[i] = avio_rl32(pb);
179  size -= 4;
180  }
181  }
182  avio_skip(pb, size);
183  }
184 
185  /* Determine overall data length */
186  if (size < 0)
187  return -1;
188  if (!size) {
189  xwma->data_end = INT64_MAX;
190  } else
191  xwma->data_end = avio_tell(pb) + size;
192 
193 
194  if (dpds_table && dpds_table_size) {
195  int64_t cur_pos;
196  const uint32_t bytes_per_sample
197  = (st->codec->channels * st->codec->bits_per_coded_sample) >> 3;
198 
199  /* Estimate the duration from the total number of output bytes. */
200  const uint64_t total_decoded_bytes = dpds_table[dpds_table_size - 1];
201 
202  if(!bytes_per_sample) {
203  av_log(s, AV_LOG_ERROR, "bytes_per_sample is 0\n");
204  return AVERROR_INVALIDDATA;
205  }
206 
207  st->duration = total_decoded_bytes / bytes_per_sample;
208 
209  /* Use the dpds data to build a seek table. We can only do this after
210  * we know the offset to the data chunk, as we need that to determine
211  * the actual offset to each input block.
212  * Note: If we allowed ourselves to assume that the data chunk always
213  * follows immediately after the dpds block, we could of course guess
214  * the data block's start offset already while reading the dpds chunk.
215  * I decided against that, just in case other chunks ever are
216  * discovered.
217  */
218  cur_pos = avio_tell(pb);
219  for (i = 0; i < dpds_table_size; ++i) {
220  /* From the number of output bytes that would accumulate in the
221  * output buffer after decoding the first (i+1) packets, we compute
222  * an offset / timestamp pair.
223  */
225  cur_pos + (i+1) * st->codec->block_align, /* pos */
226  dpds_table[i] / bytes_per_sample, /* timestamp */
227  st->codec->block_align, /* size */
228  0, /* duration */
230  }
231  } else if (st->codec->bit_rate) {
232  /* No dpds chunk was present (or only an empty one), so estimate
233  * the total duration using the average bits per sample and the
234  * total data length.
235  */
236  st->duration = (size<<3) * st->codec->sample_rate / st->codec->bit_rate;
237  }
238 
239  av_free(dpds_table);
240 
241  return 0;
242 }
243 
245 {
246  int ret, size;
247  int64_t left;
248  AVStream *st;
249  XWMAContext *xwma = s->priv_data;
250 
251  st = s->streams[0];
252 
253  left = xwma->data_end - avio_tell(s->pb);
254  if (left <= 0) {
255  return AVERROR_EOF;
256  }
257 
258  /* read a single block; the default block size is 2230. */
259  size = (st->codec->block_align > 1) ? st->codec->block_align : 2230;
260  size = FFMIN(size, left);
261 
262  ret = av_get_packet(s->pb, pkt, size);
263  if (ret < 0)
264  return ret;
265 
266  pkt->stream_index = 0;
267  return ret;
268 }
269 
271  .name = "xwma",
272  .long_name = NULL_IF_CONFIG_SMALL("Microsoft xWMA"),
273  .priv_data_size = sizeof(XWMAContext),
277 };
void * av_mallocz(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
Definition: mem.c:205
const char * s
Definition: avisynth_c.h:668
Bytestream IO Context.
Definition: avio.h:68
#define AVERROR_INVALIDDATA
Invalid data found when processing input.
Definition: error.h:59
int av_add_index_entry(AVStream *st, int64_t pos, int64_t timestamp, int size, int distance, int flags)
Add an index entry into a sorted list.
void avpriv_set_pts_info(AVStream *s, int pts_wrap_bits, unsigned int pts_num, unsigned int pts_den)
Set the time base and wrapping info for a given stream.
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:154
static int xwma_read_packet(AVFormatContext *s, AVPacket *pkt)
Definition: xwma.c:244
int64_t avio_skip(AVIOContext *s, int64_t offset)
Skip given number of bytes forward.
Definition: aviobuf.c:256
int block_align
number of bytes per packet if constant and known or 0 Used by some WAV based audio codecs...
Format I/O context.
Definition: avformat.h:944
void void avpriv_request_sample(void *avc, const char *msg,...) av_printf_format(2
Log a generic warning message about a missing feature.
int64_t data_end
Definition: xwma.c:33
static AVPacket pkt
Definition: demuxing.c:56
enum AVStreamParseType need_parsing
Definition: avformat.h:811
uint8_t * extradata
some codecs need / can use extradata like Huffman tables.
AVStream * avformat_new_stream(AVFormatContext *s, const AVCodec *c)
Add a new stream to a media file.
AVStream ** streams
Definition: avformat.h:992
uint32_t tag
Definition: movenc.c:894
#define AVERROR_EOF
End of file.
Definition: error.h:55
int av_get_packet(AVIOContext *s, AVPacket *pkt, int size)
Allocate and read the payload of a packet and initialize its fields with default values.
static av_always_inline int64_t avio_tell(AVIOContext *s)
ftell() equivalent for AVIOContext.
Definition: avio.h:248
int bits_per_coded_sample
bits per sample/pixel from the demuxer (needed for huffyuv).
static int xwma_read_header(AVFormatContext *s)
Definition: xwma.c:43
#define AVINDEX_KEYFRAME
Definition: avformat.h:599
void av_free(void *ptr)
Free a memory block which has been allocated with av_malloc(z)() or av_realloc(). ...
Definition: mem.c:183
AVInputFormat ff_xwma_demuxer
Definition: xwma.c:270
unsigned int avio_rl32(AVIOContext *s)
Definition: aviobuf.c:579
int ff_get_wav_header(AVIOContext *pb, AVCodecContext *codec, int size)
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
void av_log(void *avcl, int level, const char *fmt,...)
Definition: log.c:246
static int xwma_probe(AVProbeData *p)
Definition: xwma.c:36
int size
AVCodecContext * codec
Codec context associated with this stream.
Definition: avformat.h:662
unsigned char * buf
Buffer must have AVPROBE_PADDING_SIZE of extra allocated bytes filled with zero.
Definition: avformat.h:336
#define FF_INPUT_BUFFER_PADDING_SIZE
Required number of additionally allocated bytes at the end of the input bitstream for decoding...
int bit_rate
the average bitrate
#define FFMIN(a, b)
Definition: common.h:58
static int read_probe(AVProbeData *pd)
ret
Definition: avfilter.c:821
internal header for RIFF based (de)muxers do NOT include this in end user applications ...
static int read_header(FFV1Context *f)
Definition: ffv1dec.c:517
Stream structure.
Definition: avformat.h:643
NULL
Definition: eval.c:55
enum AVCodecID codec_id
int sample_rate
samples per second
AVIOContext * pb
I/O context.
Definition: avformat.h:977
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:148
unsigned int codec_tag
fourcc (LSB first, so "ABCD" -> ('D'<<24) + ('C'<<16) + ('B'<<8) + 'A').
static int read_packet(AVFormatContext *ctx, AVPacket *pkt)
Definition: libcdio.c:114
void * av_malloc(size_t size)
Allocate a block of size bytes with alignment suitable for all memory accesses (including vectors if ...
Definition: mem.c:73
synthesis window for stochastic i
This structure contains the data a format has to probe a file.
Definition: avformat.h:334
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFilterBuffer structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism toagain later.That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another.Buffer references ownership and permissions
int64_t duration
Decoding: duration of the stream, in stream time base.
Definition: avformat.h:696
#define AVPROBE_SCORE_MAX
maximum score, half of that is used for file-extension-based detection
Definition: avformat.h:340
Main libavformat public API header.
int eof_reached
true if eof reached
Definition: avio.h:96
int channels
number of audio channels
void * priv_data
Format private data.
Definition: avformat.h:964
const char * name
A comma separated list of short names for the format.
Definition: avformat.h:461
#define MKTAG(a, b, c, d)
Definition: common.h:282
This structure stores compressed data.