libvo-amrwbenc.c
Go to the documentation of this file.
1 /*
2  * AMR Audio encoder stub
3  * Copyright (c) 2003 the ffmpeg project
4  *
5  * This file is part of FFmpeg.
6  *
7  * FFmpeg is free software; you can redistribute it and/or
8  * modify it under the terms of the GNU Lesser General Public
9  * License as published by the Free Software Foundation; either
10  * version 2.1 of the License, or (at your option) any later version.
11  *
12  * FFmpeg is distributed in the hope that it will be useful,
13  * but WITHOUT ANY WARRANTY; without even the implied warranty of
14  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15  * Lesser General Public License for more details.
16  *
17  * You should have received a copy of the GNU Lesser General Public
18  * License along with FFmpeg; if not, write to the Free Software
19  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20  */
21 
22 #include <vo-amrwbenc/enc_if.h>
23 #include <stdio.h>
24 #include <stdlib.h>
25 
26 #include "libavutil/avstring.h"
27 #include "libavutil/internal.h"
28 #include "libavutil/mem.h"
29 #include "libavutil/opt.h"
30 #include "avcodec.h"
31 #include "internal.h"
32 
/* Size in bytes of the output buffer requested for every packet, and the
 * largest encoder return value accepted as valid: 477 bits rounded up to
 * whole bytes, plus one extra byte (61 bytes in total). */
#define MAX_PACKET_SIZE ((477 + 7) / 8 + 1)
34 
/**
 * Private context of the libvo-amrwbenc encoder wrapper.
 */
typedef struct AMRWBContext {
    /* Class pointer used by the AVOptions machinery (see .priv_class in the
     * codec definition); AVOptions expects it to be the first member. */
    struct AVClass *av_class;
    void *state;       /* encoder handle returned by E_IF_init() */
    int mode;          /* mode index handed to E_IF_encode() */
    int last_bitrate;  /* bit_rate value that 'mode' was derived from */
    int allow_dtx;     /* value of the "dtx" option, forwarded to E_IF_encode() */
} AMRWBContext;
42 
43 static const AVOption options[] = {
44  { "dtx", "Allow DTX (generate comfort noise)", offsetof(AMRWBContext, allow_dtx), AV_OPT_TYPE_INT, { .i64 = 0 }, 0, 1, AV_OPT_FLAG_AUDIO_PARAM | AV_OPT_FLAG_ENCODING_PARAM },
45  { NULL }
46 };
47 
48 static const AVClass class = {
50 };
51 
52 static int get_wb_bitrate_mode(int bitrate, void *log_ctx)
53 {
54  /* make the correspondance between bitrate and mode */
55  static const int rates[] = { 6600, 8850, 12650, 14250, 15850, 18250,
56  19850, 23050, 23850 };
57  int i, best = -1, min_diff = 0;
58  char log_buf[200];
59 
60  for (i = 0; i < 9; i++) {
61  if (rates[i] == bitrate)
62  return i;
63  if (best < 0 || abs(rates[i] - bitrate) < min_diff) {
64  best = i;
65  min_diff = abs(rates[i] - bitrate);
66  }
67  }
68  /* no bitrate matching exactly, log a warning */
69  snprintf(log_buf, sizeof(log_buf), "bitrate not supported: use one of ");
70  for (i = 0; i < 9; i++)
71  av_strlcatf(log_buf, sizeof(log_buf), "%.2fk, ", rates[i] / 1000.f);
72  av_strlcatf(log_buf, sizeof(log_buf), "using %.2fk", rates[best] / 1000.f);
73  av_log(log_ctx, AV_LOG_WARNING, "%s\n", log_buf);
74 
75  return best;
76 }
77 
79 {
80  AMRWBContext *s = avctx->priv_data;
81 
82  if (avctx->sample_rate != 16000 && avctx->strict_std_compliance > FF_COMPLIANCE_UNOFFICIAL) {
83  av_log(avctx, AV_LOG_ERROR, "Only 16000Hz sample rate supported\n");
84  return AVERROR(ENOSYS);
85  }
86 
87  if (avctx->channels != 1) {
88  av_log(avctx, AV_LOG_ERROR, "Only mono supported\n");
89  return AVERROR(ENOSYS);
90  }
91 
92  s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
93  s->last_bitrate = avctx->bit_rate;
94 
95  avctx->frame_size = 320;
96  avctx->delay = 80;
97 
98  s->state = E_IF_init();
99 
100  return 0;
101 }
102 
104 {
105  AMRWBContext *s = avctx->priv_data;
106 
107  E_IF_exit(s->state);
108  return 0;
109 }
110 
111 static int amr_wb_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
112  const AVFrame *frame, int *got_packet_ptr)
113 {
114  AMRWBContext *s = avctx->priv_data;
115  const int16_t *samples = (const int16_t *)frame->data[0];
116  int size, ret;
117 
118  if ((ret = ff_alloc_packet2(avctx, avpkt, MAX_PACKET_SIZE)) < 0)
119  return ret;
120 
121  if (s->last_bitrate != avctx->bit_rate) {
122  s->mode = get_wb_bitrate_mode(avctx->bit_rate, avctx);
123  s->last_bitrate = avctx->bit_rate;
124  }
125  size = E_IF_encode(s->state, s->mode, samples, avpkt->data, s->allow_dtx);
126  if (size <= 0 || size > MAX_PACKET_SIZE) {
127  av_log(avctx, AV_LOG_ERROR, "Error encoding frame\n");
128  return AVERROR(EINVAL);
129  }
130 
131  if (frame->pts != AV_NOPTS_VALUE)
132  avpkt->pts = frame->pts - ff_samples_to_time_base(avctx, avctx->delay);
133 
134  avpkt->size = size;
135  *got_packet_ptr = 1;
136  return 0;
137 }
138 
140  .name = "libvo_amrwbenc",
141  .type = AVMEDIA_TYPE_AUDIO,
142  .id = AV_CODEC_ID_AMR_WB,
143  .priv_data_size = sizeof(AMRWBContext),
145  .encode2 = amr_wb_encode_frame,
147  .sample_fmts = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_S16,
149  .long_name = NULL_IF_CONFIG_SMALL("Android VisualOn AMR-WB "
150  "(Adaptive Multi-Rate Wide-Band)"),
151  .priv_class = &class,
152 };
AMRWBFrame frame
AMRWB parameters decoded from bitstream.
Definition: amrwbdec.c:48
AVClass * av_class
const char * s
Definition: avisynth_c.h:668
This structure describes decoded (raw) audio or video data.
Definition: frame.h:76
AVOption.
Definition: opt.h:251
av_default_item_name
memory handling functions
static av_cold int init(AVCodecContext *avctx)
Definition: avrndec.c:35
#define AV_LOG_WARNING
Something somehow does not look correct.
Definition: log.h:154
#define AV_OPT_FLAG_AUDIO_PARAM
Definition: opt.h:284
Sinusoidal phase f
static int amr_wb_encode_frame(AVCodecContext *avctx, AVPacket *avpkt, const AVFrame *frame, int *got_packet_ptr)
signed 16 bits
Definition: samplefmt.h:52
initialize output if(nPeaks >3)%at least 3 peaks in spectrum for trying to find f0 nf0peaks
struct AMRWBContext AMRWBContext
#define av_cold
Definition: attributes.h:78
AVOptions.
int64_t pts
Presentation timestamp in time_base units (time when frame should be shown to user).
Definition: frame.h:159
static const AVOption options[]
uint8_t * data
#define AV_OPT_FLAG_ENCODING_PARAM
a generic parameter which can be set by the user for muxing or encoding
Definition: opt.h:281
static const int rates[]
#define NULL_IF_CONFIG_SMALL(x)
Return NULL if CONFIG_SMALL is true, otherwise the argument without modification. ...
void av_log(void *avcl, int level, const char *fmt,...)
Definition: log.c:246
const char * name
Name of the codec implementation.
external API header
int size
common internal API header
static int get_wb_bitrate_mode(int bitrate, void *log_ctx)
int bit_rate
the average bitrate
ret
Definition: avfilter.c:821
LIBAVUTIL_VERSION_INT
Definition: eval.c:55
int ff_alloc_packet2(AVCodecContext *avctx, AVPacket *avpkt, int size)
Check AVPacket size and/or allocate data.
int frame_size
Number of samples per channel in an audio frame.
NULL
Definition: eval.c:55
#define FF_COMPLIANCE_UNOFFICIAL
Allow unofficial extensions.
int sample_rate
samples per second
main external API structure.
static void close(AVCodecParserContext *s)
Definition: h264_parser.c:375
#define AV_LOG_ERROR
Something went wrong and cannot losslessly be recovered.
Definition: log.h:148
#define MAX_PACKET_SIZE
Describe the class of an AVClass context structure.
Definition: log.h:50
synthesis window for stochastic i
size_t av_strlcatf(char *dst, size_t size, const char *fmt,...)
Definition: avstring.c:100
#define snprintf
Definition: snprintf.h:34
Filter the word “frame” indicates either a video frame or a group of audio as stored in an AVFilterBuffer structure Format for each input and each output the list of supported formats For video that means pixel format For audio that means channel sample they are references to shared objects When the negotiation mechanism computes the intersection of the formats supported at each end of a all references to both lists are replaced with a reference to the intersection And when a single format is eventually chosen for a link amongst the remaining all references to the list are updated That means that if a filter requires that its input and output have the same format amongst a supported all it has to do is use a reference to the same list of formats query_formats can leave some formats unset and return AVERROR(EAGAIN) to cause the negotiation mechanism to try again later. That can be used by filters with complex requirements to use the format negotiated on one link to set the formats supported on another. Buffer references ownership and permissions
uint8_t * data[AV_NUM_DATA_POINTERS]
pointer to the picture/channel planes.
Definition: frame.h:87
common internal api header.
AVSampleFormat
Audio Sample Formats.
Definition: samplefmt.h:49
static int amr_wb_encode_close(AVCodecContext *avctx)
static av_cold int amr_wb_encode_init(AVCodecContext *avctx)
int channels
number of audio channels
static enum AVSampleFormat sample_fmts[]
Definition: adpcmenc.c:700
Filter the word “frame” indicates either a video frame or a group of audio samples
static av_always_inline int64_t ff_samples_to_time_base(AVCodecContext *avctx, int64_t samples)
Rescale from sample rate to AVCodecContext.time_base.
This structure stores compressed data.
int delay
Codec delay.
int strict_std_compliance
strictly follow the standard (MPEG4, ...).
int64_t pts
Presentation timestamp in AVStream->time_base units; the time at which the decompressed packet will b...
AVCodec ff_libvo_amrwbenc_encoder
#define AV_NOPTS_VALUE
Undefined timestamp value.
Definition: avutil.h:190