/*
 * Copyright (c) 2002 Mark Hills <mark@pogo.org.uk>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

#include <string.h>

#include <vorbis/vorbisenc.h>

#include "libavutil/avassert.h"
#include "libavutil/fifo.h"
#include "libavutil/opt.h"
#include "avcodec.h"
#include "audio_frame_queue.h"
#include "internal.h"
#include "vorbis.h"
#include "vorbis_parser.h"


/*
 * Number of samples the caller is expected to submit in each encode call.
 * The value is the LCD of all possible frame sizes, which guarantees that
 * every output packet begins at the same point as one of the input packets.
 */
#define OGGVORBIS_FRAME_SIZE 64

/* Size in bytes requested for the output packet FIFO. */
#define BUFFER_SIZE (64 * 1024)

42 typedef struct OggVorbisEncContext {
|
yading@10
|
43 AVClass *av_class; /**< class for AVOptions */
|
yading@10
|
44 AVFrame frame;
|
yading@10
|
45 vorbis_info vi; /**< vorbis_info used during init */
|
yading@10
|
46 vorbis_dsp_state vd; /**< DSP state used for analysis */
|
yading@10
|
47 vorbis_block vb; /**< vorbis_block used for analysis */
|
yading@10
|
48 AVFifoBuffer *pkt_fifo; /**< output packet buffer */
|
yading@10
|
49 int eof; /**< end-of-file flag */
|
yading@10
|
50 int dsp_initialized; /**< vd has been initialized */
|
yading@10
|
51 vorbis_comment vc; /**< VorbisComment info */
|
yading@10
|
52 double iblock; /**< impulse block bias option */
|
yading@10
|
53 VorbisParseContext vp; /**< parse context to get durations */
|
yading@10
|
54 AudioFrameQueue afq; /**< frame queue for timestamps */
|
yading@10
|
55 } OggVorbisEncContext;
|
yading@10
|
56
|
yading@10
|
57 static const AVOption options[] = {
|
yading@10
|
58 { "iblock", "Sets the impulse block bias", offsetof(OggVorbisEncContext, iblock), AV_OPT_TYPE_DOUBLE, { .dbl = 0 }, -15, 0, AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM },
|
yading@10
|
59 { NULL }
|
yading@10
|
60 };
|
yading@10
|
61
|
yading@10
|
62 static const AVCodecDefault defaults[] = {
|
yading@10
|
63 { "b", "0" },
|
yading@10
|
64 { NULL },
|
yading@10
|
65 };
|
yading@10
|
66
|
yading@10
|
67 static const AVClass class = {
|
yading@10
|
68 .class_name = "libvorbis",
|
yading@10
|
69 .item_name = av_default_item_name,
|
yading@10
|
70 .option = options,
|
yading@10
|
71 .version = LIBAVUTIL_VERSION_INT,
|
yading@10
|
72 };
|
yading@10
|
73
|
yading@10
|
74 static int vorbis_error_to_averror(int ov_err)
|
yading@10
|
75 {
|
yading@10
|
76 switch (ov_err) {
|
yading@10
|
77 case OV_EFAULT: return AVERROR_BUG;
|
yading@10
|
78 case OV_EINVAL: return AVERROR(EINVAL);
|
yading@10
|
79 case OV_EIMPL: return AVERROR(EINVAL);
|
yading@10
|
80 default: return AVERROR_UNKNOWN;
|
yading@10
|
81 }
|
yading@10
|
82 }
|
yading@10
|
83
|
yading@10
|
84 static av_cold int oggvorbis_init_encoder(vorbis_info *vi,
|
yading@10
|
85 AVCodecContext *avctx)
|
yading@10
|
86 {
|
yading@10
|
87 OggVorbisEncContext *s = avctx->priv_data;
|
yading@10
|
88 double cfreq;
|
yading@10
|
89 int ret;
|
yading@10
|
90
|
yading@10
|
91 if (avctx->flags & CODEC_FLAG_QSCALE || !avctx->bit_rate) {
|
yading@10
|
92 /* variable bitrate
|
yading@10
|
93 * NOTE: we use the oggenc range of -1 to 10 for global_quality for
|
yading@10
|
94 * user convenience, but libvorbis uses -0.1 to 1.0.
|
yading@10
|
95 */
|
yading@10
|
96 float q = avctx->global_quality / (float)FF_QP2LAMBDA;
|
yading@10
|
97 /* default to 3 if the user did not set quality or bitrate */
|
yading@10
|
98 if (!(avctx->flags & CODEC_FLAG_QSCALE))
|
yading@10
|
99 q = 3.0;
|
yading@10
|
100 if ((ret = vorbis_encode_setup_vbr(vi, avctx->channels,
|
yading@10
|
101 avctx->sample_rate,
|
yading@10
|
102 q / 10.0)))
|
yading@10
|
103 goto error;
|
yading@10
|
104 } else {
|
yading@10
|
105 int minrate = avctx->rc_min_rate > 0 ? avctx->rc_min_rate : -1;
|
yading@10
|
106 int maxrate = avctx->rc_max_rate > 0 ? avctx->rc_max_rate : -1;
|
yading@10
|
107
|
yading@10
|
108 /* average bitrate */
|
yading@10
|
109 if ((ret = vorbis_encode_setup_managed(vi, avctx->channels,
|
yading@10
|
110 avctx->sample_rate, maxrate,
|
yading@10
|
111 avctx->bit_rate, minrate)))
|
yading@10
|
112 goto error;
|
yading@10
|
113
|
yading@10
|
114 /* variable bitrate by estimate, disable slow rate management */
|
yading@10
|
115 if (minrate == -1 && maxrate == -1)
|
yading@10
|
116 if ((ret = vorbis_encode_ctl(vi, OV_ECTL_RATEMANAGE2_SET, NULL)))
|
yading@10
|
117 goto error; /* should not happen */
|
yading@10
|
118 }
|
yading@10
|
119
|
yading@10
|
120 /* cutoff frequency */
|
yading@10
|
121 if (avctx->cutoff > 0) {
|
yading@10
|
122 cfreq = avctx->cutoff / 1000.0;
|
yading@10
|
123 if ((ret = vorbis_encode_ctl(vi, OV_ECTL_LOWPASS_SET, &cfreq)))
|
yading@10
|
124 goto error; /* should not happen */
|
yading@10
|
125 }
|
yading@10
|
126
|
yading@10
|
127 /* impulse block bias */
|
yading@10
|
128 if (s->iblock) {
|
yading@10
|
129 if ((ret = vorbis_encode_ctl(vi, OV_ECTL_IBLOCK_SET, &s->iblock)))
|
yading@10
|
130 goto error;
|
yading@10
|
131 }
|
yading@10
|
132
|
yading@10
|
133 if (avctx->channels == 3 &&
|
yading@10
|
134 avctx->channel_layout != (AV_CH_LAYOUT_STEREO|AV_CH_FRONT_CENTER) ||
|
yading@10
|
135 avctx->channels == 4 &&
|
yading@10
|
136 avctx->channel_layout != AV_CH_LAYOUT_2_2 &&
|
yading@10
|
137 avctx->channel_layout != AV_CH_LAYOUT_QUAD ||
|
yading@10
|
138 avctx->channels == 5 &&
|
yading@10
|
139 avctx->channel_layout != AV_CH_LAYOUT_5POINT0 &&
|
yading@10
|
140 avctx->channel_layout != AV_CH_LAYOUT_5POINT0_BACK ||
|
yading@10
|
141 avctx->channels == 6 &&
|
yading@10
|
142 avctx->channel_layout != AV_CH_LAYOUT_5POINT1 &&
|
yading@10
|
143 avctx->channel_layout != AV_CH_LAYOUT_5POINT1_BACK ||
|
yading@10
|
144 avctx->channels == 7 &&
|
yading@10
|
145 avctx->channel_layout != (AV_CH_LAYOUT_5POINT1|AV_CH_BACK_CENTER) ||
|
yading@10
|
146 avctx->channels == 8 &&
|
yading@10
|
147 avctx->channel_layout != AV_CH_LAYOUT_7POINT1) {
|
yading@10
|
148 if (avctx->channel_layout) {
|
yading@10
|
149 char name[32];
|
yading@10
|
150 av_get_channel_layout_string(name, sizeof(name), avctx->channels,
|
yading@10
|
151 avctx->channel_layout);
|
yading@10
|
152 av_log(avctx, AV_LOG_ERROR, "%s not supported by Vorbis: "
|
yading@10
|
153 "output stream will have incorrect "
|
yading@10
|
154 "channel layout.\n", name);
|
yading@10
|
155 } else {
|
yading@10
|
156 av_log(avctx, AV_LOG_WARNING, "No channel layout specified. The encoder "
|
yading@10
|
157 "will use Vorbis channel layout for "
|
yading@10
|
158 "%d channels.\n", avctx->channels);
|
yading@10
|
159 }
|
yading@10
|
160 }
|
yading@10
|
161
|
yading@10
|
162 if ((ret = vorbis_encode_setup_init(vi)))
|
yading@10
|
163 goto error;
|
yading@10
|
164
|
yading@10
|
165 return 0;
|
yading@10
|
166 error:
|
yading@10
|
167 return vorbis_error_to_averror(ret);
|
yading@10
|
168 }
|
yading@10
|
169
|
yading@10
|
/*
 * Number of bytes needed to store a buffer of length 'l' together with its
 * length prefix: one prefix byte, plus one more for every full 255 bytes of
 * payload, plus the payload itself.
 */
static int xiph_len(int l)
{
    const int prefix_bytes = 1 + l / 255;

    return prefix_bytes + l;
}

176 static av_cold int oggvorbis_encode_close(AVCodecContext *avctx)
|
yading@10
|
177 {
|
yading@10
|
178 OggVorbisEncContext *s = avctx->priv_data;
|
yading@10
|
179
|
yading@10
|
180 /* notify vorbisenc this is EOF */
|
yading@10
|
181 if (s->dsp_initialized)
|
yading@10
|
182 vorbis_analysis_wrote(&s->vd, 0);
|
yading@10
|
183
|
yading@10
|
184 vorbis_block_clear(&s->vb);
|
yading@10
|
185 vorbis_dsp_clear(&s->vd);
|
yading@10
|
186 vorbis_info_clear(&s->vi);
|
yading@10
|
187
|
yading@10
|
188 av_fifo_free(s->pkt_fifo);
|
yading@10
|
189 ff_af_queue_close(&s->afq);
|
yading@10
|
190 av_freep(&avctx->extradata);
|
yading@10
|
191
|
yading@10
|
192 return 0;
|
yading@10
|
193 }
|
yading@10
|
194
|
yading@10
|
195 static av_cold int oggvorbis_encode_init(AVCodecContext *avctx)
|
yading@10
|
196 {
|
yading@10
|
197 OggVorbisEncContext *s = avctx->priv_data;
|
yading@10
|
198 ogg_packet header, header_comm, header_code;
|
yading@10
|
199 uint8_t *p;
|
yading@10
|
200 unsigned int offset;
|
yading@10
|
201 int ret;
|
yading@10
|
202
|
yading@10
|
203 vorbis_info_init(&s->vi);
|
yading@10
|
204 if ((ret = oggvorbis_init_encoder(&s->vi, avctx))) {
|
yading@10
|
205 av_log(avctx, AV_LOG_ERROR, "encoder setup failed\n");
|
yading@10
|
206 goto error;
|
yading@10
|
207 }
|
yading@10
|
208 if ((ret = vorbis_analysis_init(&s->vd, &s->vi))) {
|
yading@10
|
209 av_log(avctx, AV_LOG_ERROR, "analysis init failed\n");
|
yading@10
|
210 ret = vorbis_error_to_averror(ret);
|
yading@10
|
211 goto error;
|
yading@10
|
212 }
|
yading@10
|
213 s->dsp_initialized = 1;
|
yading@10
|
214 if ((ret = vorbis_block_init(&s->vd, &s->vb))) {
|
yading@10
|
215 av_log(avctx, AV_LOG_ERROR, "dsp init failed\n");
|
yading@10
|
216 ret = vorbis_error_to_averror(ret);
|
yading@10
|
217 goto error;
|
yading@10
|
218 }
|
yading@10
|
219
|
yading@10
|
220 vorbis_comment_init(&s->vc);
|
yading@10
|
221 if (!(avctx->flags & CODEC_FLAG_BITEXACT))
|
yading@10
|
222 vorbis_comment_add_tag(&s->vc, "encoder", LIBAVCODEC_IDENT);
|
yading@10
|
223
|
yading@10
|
224 if ((ret = vorbis_analysis_headerout(&s->vd, &s->vc, &header, &header_comm,
|
yading@10
|
225 &header_code))) {
|
yading@10
|
226 ret = vorbis_error_to_averror(ret);
|
yading@10
|
227 goto error;
|
yading@10
|
228 }
|
yading@10
|
229
|
yading@10
|
230 avctx->extradata_size = 1 + xiph_len(header.bytes) +
|
yading@10
|
231 xiph_len(header_comm.bytes) +
|
yading@10
|
232 header_code.bytes;
|
yading@10
|
233 p = avctx->extradata = av_malloc(avctx->extradata_size +
|
yading@10
|
234 FF_INPUT_BUFFER_PADDING_SIZE);
|
yading@10
|
235 if (!p) {
|
yading@10
|
236 ret = AVERROR(ENOMEM);
|
yading@10
|
237 goto error;
|
yading@10
|
238 }
|
yading@10
|
239 p[0] = 2;
|
yading@10
|
240 offset = 1;
|
yading@10
|
241 offset += av_xiphlacing(&p[offset], header.bytes);
|
yading@10
|
242 offset += av_xiphlacing(&p[offset], header_comm.bytes);
|
yading@10
|
243 memcpy(&p[offset], header.packet, header.bytes);
|
yading@10
|
244 offset += header.bytes;
|
yading@10
|
245 memcpy(&p[offset], header_comm.packet, header_comm.bytes);
|
yading@10
|
246 offset += header_comm.bytes;
|
yading@10
|
247 memcpy(&p[offset], header_code.packet, header_code.bytes);
|
yading@10
|
248 offset += header_code.bytes;
|
yading@10
|
249 av_assert0(offset == avctx->extradata_size);
|
yading@10
|
250
|
yading@10
|
251 if ((ret = avpriv_vorbis_parse_extradata(avctx, &s->vp)) < 0) {
|
yading@10
|
252 av_log(avctx, AV_LOG_ERROR, "invalid extradata\n");
|
yading@10
|
253 return ret;
|
yading@10
|
254 }
|
yading@10
|
255
|
yading@10
|
256 vorbis_comment_clear(&s->vc);
|
yading@10
|
257
|
yading@10
|
258 avctx->frame_size = OGGVORBIS_FRAME_SIZE;
|
yading@10
|
259 ff_af_queue_init(avctx, &s->afq);
|
yading@10
|
260
|
yading@10
|
261 s->pkt_fifo = av_fifo_alloc(BUFFER_SIZE);
|
yading@10
|
262 if (!s->pkt_fifo) {
|
yading@10
|
263 ret = AVERROR(ENOMEM);
|
yading@10
|
264 goto error;
|
yading@10
|
265 }
|
yading@10
|
266
|
yading@10
|
267 return 0;
|
yading@10
|
268 error:
|
yading@10
|
269 oggvorbis_encode_close(avctx);
|
yading@10
|
270 return ret;
|
yading@10
|
271 }
|
yading@10
|
272
|
yading@10
|
273 static int oggvorbis_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
|
yading@10
|
274 const AVFrame *frame, int *got_packet_ptr)
|
yading@10
|
275 {
|
yading@10
|
276 OggVorbisEncContext *s = avctx->priv_data;
|
yading@10
|
277 ogg_packet op;
|
yading@10
|
278 int ret, duration;
|
yading@10
|
279
|
yading@10
|
280 /* send samples to libvorbis */
|
yading@10
|
281 if (frame) {
|
yading@10
|
282 const int samples = frame->nb_samples;
|
yading@10
|
283 float **buffer;
|
yading@10
|
284 int c, channels = s->vi.channels;
|
yading@10
|
285
|
yading@10
|
286 buffer = vorbis_analysis_buffer(&s->vd, samples);
|
yading@10
|
287 for (c = 0; c < channels; c++) {
|
yading@10
|
288 int co = (channels > 8) ? c :
|
yading@10
|
289 ff_vorbis_encoding_channel_layout_offsets[channels - 1][c];
|
yading@10
|
290 memcpy(buffer[c], frame->extended_data[co],
|
yading@10
|
291 samples * sizeof(*buffer[c]));
|
yading@10
|
292 }
|
yading@10
|
293 if ((ret = vorbis_analysis_wrote(&s->vd, samples)) < 0) {
|
yading@10
|
294 av_log(avctx, AV_LOG_ERROR, "error in vorbis_analysis_wrote()\n");
|
yading@10
|
295 return vorbis_error_to_averror(ret);
|
yading@10
|
296 }
|
yading@10
|
297 if ((ret = ff_af_queue_add(&s->afq, frame)) < 0)
|
yading@10
|
298 return ret;
|
yading@10
|
299 } else {
|
yading@10
|
300 if (!s->eof)
|
yading@10
|
301 if ((ret = vorbis_analysis_wrote(&s->vd, 0)) < 0) {
|
yading@10
|
302 av_log(avctx, AV_LOG_ERROR, "error in vorbis_analysis_wrote()\n");
|
yading@10
|
303 return vorbis_error_to_averror(ret);
|
yading@10
|
304 }
|
yading@10
|
305 s->eof = 1;
|
yading@10
|
306 }
|
yading@10
|
307
|
yading@10
|
308 /* retrieve available packets from libvorbis */
|
yading@10
|
309 while ((ret = vorbis_analysis_blockout(&s->vd, &s->vb)) == 1) {
|
yading@10
|
310 if ((ret = vorbis_analysis(&s->vb, NULL)) < 0)
|
yading@10
|
311 break;
|
yading@10
|
312 if ((ret = vorbis_bitrate_addblock(&s->vb)) < 0)
|
yading@10
|
313 break;
|
yading@10
|
314
|
yading@10
|
315 /* add any available packets to the output packet buffer */
|
yading@10
|
316 while ((ret = vorbis_bitrate_flushpacket(&s->vd, &op)) == 1) {
|
yading@10
|
317 if (av_fifo_space(s->pkt_fifo) < sizeof(ogg_packet) + op.bytes) {
|
yading@10
|
318 av_log(avctx, AV_LOG_ERROR, "packet buffer is too small\n");
|
yading@10
|
319 return AVERROR_BUG;
|
yading@10
|
320 }
|
yading@10
|
321 av_fifo_generic_write(s->pkt_fifo, &op, sizeof(ogg_packet), NULL);
|
yading@10
|
322 av_fifo_generic_write(s->pkt_fifo, op.packet, op.bytes, NULL);
|
yading@10
|
323 }
|
yading@10
|
324 if (ret < 0) {
|
yading@10
|
325 av_log(avctx, AV_LOG_ERROR, "error getting available packets\n");
|
yading@10
|
326 break;
|
yading@10
|
327 }
|
yading@10
|
328 }
|
yading@10
|
329 if (ret < 0) {
|
yading@10
|
330 av_log(avctx, AV_LOG_ERROR, "error getting available packets\n");
|
yading@10
|
331 return vorbis_error_to_averror(ret);
|
yading@10
|
332 }
|
yading@10
|
333
|
yading@10
|
334 /* check for available packets */
|
yading@10
|
335 if (av_fifo_size(s->pkt_fifo) < sizeof(ogg_packet))
|
yading@10
|
336 return 0;
|
yading@10
|
337
|
yading@10
|
338 av_fifo_generic_read(s->pkt_fifo, &op, sizeof(ogg_packet), NULL);
|
yading@10
|
339
|
yading@10
|
340 if ((ret = ff_alloc_packet2(avctx, avpkt, op.bytes)) < 0)
|
yading@10
|
341 return ret;
|
yading@10
|
342 av_fifo_generic_read(s->pkt_fifo, avpkt->data, op.bytes, NULL);
|
yading@10
|
343
|
yading@10
|
344 avpkt->pts = ff_samples_to_time_base(avctx, op.granulepos);
|
yading@10
|
345
|
yading@10
|
346 duration = avpriv_vorbis_parse_frame(&s->vp, avpkt->data, avpkt->size);
|
yading@10
|
347 if (duration > 0) {
|
yading@10
|
348 /* we do not know encoder delay until we get the first packet from
|
yading@10
|
349 * libvorbis, so we have to update the AudioFrameQueue counts */
|
yading@10
|
350 if (!avctx->delay && s->afq.frames) {
|
yading@10
|
351 avctx->delay = duration;
|
yading@10
|
352 av_assert0(!s->afq.remaining_delay);
|
yading@10
|
353 s->afq.frames->duration += duration;
|
yading@10
|
354 s->afq.frames->pts -= duration;
|
yading@10
|
355 s->afq.remaining_samples += duration;
|
yading@10
|
356 }
|
yading@10
|
357 ff_af_queue_remove(&s->afq, duration, &avpkt->pts, &avpkt->duration);
|
yading@10
|
358 }
|
yading@10
|
359
|
yading@10
|
360 *got_packet_ptr = 1;
|
yading@10
|
361 return 0;
|
yading@10
|
362 }
|
yading@10
|
363
|
yading@10
|
364 AVCodec ff_libvorbis_encoder = {
|
yading@10
|
365 .name = "libvorbis",
|
yading@10
|
366 .type = AVMEDIA_TYPE_AUDIO,
|
yading@10
|
367 .id = AV_CODEC_ID_VORBIS,
|
yading@10
|
368 .priv_data_size = sizeof(OggVorbisEncContext),
|
yading@10
|
369 .init = oggvorbis_encode_init,
|
yading@10
|
370 .encode2 = oggvorbis_encode_frame,
|
yading@10
|
371 .close = oggvorbis_encode_close,
|
yading@10
|
372 .capabilities = CODEC_CAP_DELAY,
|
yading@10
|
373 .sample_fmts = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLTP,
|
yading@10
|
374 AV_SAMPLE_FMT_NONE },
|
yading@10
|
375 .long_name = NULL_IF_CONFIG_SMALL("libvorbis"),
|
yading@10
|
376 .priv_class = &class,
|
yading@10
|
377 .defaults = defaults,
|
yading@10
|
378 };
|