yading@10
|
1 /*
|
yading@10
|
2 * Common code between the AC-3 and E-AC-3 decoders
|
yading@10
|
3 * Copyright (c) 2007 Bartlomiej Wolowiec <bartek.wolowiec@gmail.com>
|
yading@10
|
4 *
|
yading@10
|
5 * This file is part of FFmpeg.
|
yading@10
|
6 *
|
yading@10
|
7 * FFmpeg is free software; you can redistribute it and/or
|
yading@10
|
8 * modify it under the terms of the GNU Lesser General Public
|
yading@10
|
9 * License as published by the Free Software Foundation; either
|
yading@10
|
10 * version 2.1 of the License, or (at your option) any later version.
|
yading@10
|
11 *
|
yading@10
|
12 * FFmpeg is distributed in the hope that it will be useful,
|
yading@10
|
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
|
yading@10
|
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
yading@10
|
15 * Lesser General Public License for more details.
|
yading@10
|
16 *
|
yading@10
|
17 * You should have received a copy of the GNU Lesser General Public
|
yading@10
|
18 * License along with FFmpeg; if not, write to the Free Software
|
yading@10
|
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
yading@10
|
20 */
|
yading@10
|
21
|
yading@10
|
22 /**
|
yading@10
|
23 * @file
|
yading@10
|
24 * Common code between the AC-3 and E-AC-3 decoders.
|
yading@10
|
25 *
|
yading@10
|
26 * Summary of MDCT Coefficient Grouping:
|
yading@10
|
27 * The individual MDCT coefficient indices are often referred to in the
|
yading@10
|
28 * (E-)AC-3 specification as frequency bins. These bins are grouped together
|
yading@10
|
29 * into subbands of 12 coefficients each. The subbands are grouped together
|
yading@10
|
30 * into bands as defined in the bitstream by the band structures, which
|
yading@10
|
31 * determine the number of bands and the size of each band. The full spectrum
|
yading@10
|
32 * of 256 frequency bins is divided into 1 DC bin + 21 subbands = 253 bins.
|
yading@10
|
33 * This system of grouping coefficients is used for channel bandwidth, stereo
|
yading@10
|
34 * rematrixing, channel coupling, enhanced coupling, and spectral extension.
|
yading@10
|
35 *
|
yading@10
|
36 *      +-+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+-+
|
yading@10
|
37 *      |1|  |12|  |  [12|12|12|12]  |  |  |  |  |  |  |  |  |  |  |  |  |3|
|
yading@10
|
38 *      +-+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+--+-+
|
yading@10
|
39 *      ~~~  ~~~~     ~~~~~~~~~~~~~                                      ~~~
|
yading@10
|
40 *       |     |            |                                             |
|
yading@10
|
41 *       |     |            |                    3 unused frequency bins--+
|
yading@10
|
42 *       |     |            |
|
yading@10
|
43 *       |     |            +--1 band containing 4 subbands
|
yading@10
|
44 *       |     |
|
yading@10
|
45 *       |     +--1 subband of 12 frequency bins
|
yading@10
|
46 *       |
|
yading@10
|
47 *       +--DC frequency bin
|
yading@10
|
48 */
|
yading@10
|
49
|
yading@10
|
50 #ifndef AVCODEC_AC3DEC_H
|
yading@10
|
51 #define AVCODEC_AC3DEC_H
|
yading@10
|
52
|
yading@10
|
53 #include "libavutil/float_dsp.h"
|
yading@10
|
54 #include "libavutil/lfg.h"
|
yading@10
|
55 #include "ac3.h"
|
yading@10
|
56 #include "ac3dsp.h"
|
yading@10
|
57 #include "get_bits.h"
|
yading@10
|
58 #include "dsputil.h"
|
yading@10
|
59 #include "fft.h"
|
yading@10
|
60 #include "fmtconvert.h"
|
yading@10
|
61
|
yading@10
|
/** NOTE(review): presumably a flag bit combined with a channel mode in output_mode to request LFE output -- meaning is not shown in this header; confirm against the decoder. */
62 #define AC3_OUTPUT_LFEON 8
|
yading@10
|
63
|
yading@10
|
/** Array bound for the per-band spectral extension tables (spx_band_sizes, spx_noise_blend, spx_signal_blend). */
64 #define SPX_MAX_BANDS 17
|
yading@10
|
65
|
yading@10
|
66 /** Large enough for maximum possible frame size when the specification limit is ignored; sizes input_buffer (plus FF_INPUT_BUFFER_PADDING_SIZE). */
|
yading@10
|
67 #define AC3_FRAME_BUFFER_SIZE 32768
|
yading@10
|
68
|
yading@10
|
/**
 * Decoder state shared by the AC-3 and E-AC-3 decoding code; the ff_eac3_*
 * functions declared in this header all operate on a pointer to it.
 * Fields are organized into Doxygen member groups (@name ... @{ ... @}).
 */
69 typedef struct AC3DecodeContext {
|
yading@10
|
70 AVClass *class; ///< class for AVOptions
|
yading@10
|
71 AVCodecContext *avctx; ///< parent context
|
yading@10
|
72 GetBitContext gbc; ///< bitstream reader
|
yading@10
|
73
|
yading@10
|
74 ///@name Bit stream information
|
yading@10
|
75 ///@{
|
yading@10
|
76 int frame_type; ///< frame type (strmtyp)
|
yading@10
|
77 int substreamid; ///< substream identification
|
yading@10
|
78 int frame_size; ///< current frame size, in bytes
|
yading@10
|
79 int bit_rate; ///< stream bit rate, in bits-per-second
|
yading@10
|
80 int sample_rate; ///< sample frequency, in Hz
|
yading@10
|
81 int num_blocks; ///< number of audio blocks
|
yading@10
|
82 int bitstream_mode; ///< bitstream mode (bsmod)
|
yading@10
|
83 int channel_mode; ///< channel mode (acmod)
|
yading@10
|
84 int channel_layout; ///< channel layout
|
yading@10
|
85 int lfe_on; ///< lfe channel in use
|
yading@10
|
86 int channel_map; ///< custom channel map
|
yading@10
|
87 int center_mix_level; ///< Center mix level index
|
yading@10
|
88 int surround_mix_level; ///< Surround mix level index
|
yading@10
|
89 int eac3; ///< indicates if current frame is E-AC-3
|
yading@10
|
90 ///@}
|
yading@10
|
91
|
yading@10
|
92 int preferred_stereo_downmix; ///< NOTE(review): presumably the preferred stereo downmix mode; value encoding not shown in this header -- confirm
|
yading@10
|
93 float ltrt_center_mix_level; ///< NOTE(review): presumably the center mix level for an Lt/Rt downmix -- confirm
|
yading@10
|
94 float ltrt_surround_mix_level; ///< NOTE(review): presumably the surround mix level for an Lt/Rt downmix -- confirm
|
yading@10
|
95 float loro_center_mix_level; ///< NOTE(review): presumably the center mix level for a Lo/Ro downmix -- confirm
|
yading@10
|
96 float loro_surround_mix_level; ///< NOTE(review): presumably the surround mix level for a Lo/Ro downmix -- confirm
|
yading@10
|
97
|
yading@10
|
98 ///@name Frame syntax parameters
///@{
|
yading@10
|
99 int snr_offset_strategy; ///< SNR offset strategy (snroffststr)
|
yading@10
|
100 int block_switch_syntax; ///< block switch syntax enabled (blkswe)
|
yading@10
|
101 int dither_flag_syntax; ///< dither flag syntax enabled (dithflage)
|
yading@10
|
102 int bit_allocation_syntax; ///< bit allocation model syntax enabled (bamode)
|
yading@10
|
103 int fast_gain_syntax; ///< fast gain codes enabled (frmfgaincode)
|
yading@10
|
104 int dba_syntax; ///< delta bit allocation syntax enabled (dbaflde)
|
yading@10
|
105 int skip_syntax; ///< skip field syntax enabled (skipflde)
|
yading@10
|
106 ///@}
|
yading@10
|
107
|
yading@10
|
108 ///@name Standard coupling
///@{
|
yading@10
|
109 int cpl_in_use[AC3_MAX_BLOCKS]; ///< coupling in use (cplinu)
|
yading@10
|
110 int cpl_strategy_exists[AC3_MAX_BLOCKS];///< coupling strategy exists (cplstre)
|
yading@10
|
111 int channel_in_cpl[AC3_MAX_CHANNELS]; ///< channel in coupling (chincpl)
|
yading@10
|
112 int phase_flags_in_use; ///< phase flags in use (phsflginu)
|
yading@10
|
113 int phase_flags[AC3_MAX_CPL_BANDS]; ///< phase flags (phsflg)
|
yading@10
|
114 int num_cpl_bands; ///< number of coupling bands (ncplbnd)
|
yading@10
|
115 uint8_t cpl_band_sizes[AC3_MAX_CPL_BANDS]; ///< number of coeffs in each coupling band
|
yading@10
|
116 int firstchincpl; ///< first channel in coupling
|
yading@10
|
117 int first_cpl_coords[AC3_MAX_CHANNELS]; ///< first coupling coordinates states (firstcplcos)
|
yading@10
|
118 int cpl_coords[AC3_MAX_CHANNELS][AC3_MAX_CPL_BANDS]; ///< coupling coordinates (cplco)
|
yading@10
|
119 ///@}
|
yading@10
|
120
|
yading@10
|
121 ///@name Spectral extension
|
yading@10
|
122 ///@{
|
yading@10
|
123 int spx_in_use; ///< spectral extension in use (spxinu)
|
yading@10
|
124 uint8_t channel_uses_spx[AC3_MAX_CHANNELS]; ///< channel uses spectral extension (chinspx)
|
yading@10
|
125 int8_t spx_atten_code[AC3_MAX_CHANNELS]; ///< spx attenuation code (spxattencod)
|
yading@10
|
126 int spx_src_start_freq; ///< spx start frequency bin
|
yading@10
|
127 int spx_dst_end_freq; ///< spx end frequency bin
|
yading@10
|
128 int spx_dst_start_freq; ///< spx starting frequency bin for copying (copystartmant)
|
yading@10
|
129 ///< the copy region ends at the start of the spx region.
|
yading@10
|
130 int num_spx_bands; ///< number of spx bands (nspxbnds)
|
yading@10
|
131 uint8_t spx_band_sizes[SPX_MAX_BANDS]; ///< number of bins in each spx band
|
yading@10
|
132 uint8_t first_spx_coords[AC3_MAX_CHANNELS]; ///< first spx coordinates states (firstspxcos)
|
yading@10
|
133 float spx_noise_blend[AC3_MAX_CHANNELS][SPX_MAX_BANDS]; ///< spx noise blending factor (nblendfact)
|
yading@10
|
134 float spx_signal_blend[AC3_MAX_CHANNELS][SPX_MAX_BANDS];///< spx signal blending factor (sblendfact)
|
yading@10
|
135 ///@}
|
yading@10
|
136
|
yading@10
|
137 ///@name Adaptive hybrid transform
///@{
|
yading@10
|
138 int channel_uses_aht[AC3_MAX_CHANNELS]; ///< channel AHT in use (chahtinu)
|
yading@10
|
139 int pre_mantissa[AC3_MAX_CHANNELS][AC3_MAX_COEFS][AC3_MAX_BLOCKS]; ///< pre-IDCT mantissas
|
yading@10
|
140 ///@}
|
yading@10
|
141
|
yading@10
|
142 ///@name Channel
///@{
|
yading@10
|
143 int fbw_channels; ///< number of full-bandwidth channels
|
yading@10
|
144 int channels; ///< number of total channels
|
yading@10
|
145 int lfe_ch; ///< index of LFE channel
|
yading@10
|
146 float downmix_coeffs[AC3_MAX_CHANNELS][2]; ///< stereo downmix coefficients
|
yading@10
|
147 int downmixed; ///< indicates if coeffs are currently downmixed
|
yading@10
|
148 int output_mode; ///< output channel configuration
|
yading@10
|
149 int out_channels; ///< number of output channels
|
yading@10
|
150 ///@}
|
yading@10
|
151
|
yading@10
|
152 ///@name Dynamic range
///@{
|
yading@10
|
153 float dynamic_range[2]; ///< dynamic range
|
yading@10
|
154 float drc_scale; ///< percentage of dynamic range compression to be applied
|
yading@10
|
155 ///@}
|
yading@10
|
156
|
yading@10
|
157 ///@name Bandwidth
///@{
|
yading@10
|
158 int start_freq[AC3_MAX_CHANNELS]; ///< start frequency bin (strtmant)
|
yading@10
|
159 int end_freq[AC3_MAX_CHANNELS]; ///< end frequency bin (endmant)
|
yading@10
|
160 ///@}
|
yading@10
|
161
|
yading@10
|
162 ///@name Rematrixing
///@{
|
yading@10
|
163 int num_rematrixing_bands; ///< number of rematrixing bands (nrematbnd)
|
yading@10
|
164 int rematrixing_flags[4]; ///< rematrixing flags (rematflg)
|
yading@10
|
165 ///@}
|
yading@10
|
166
|
yading@10
|
167 ///@name Exponents
///@{
|
yading@10
|
168 int num_exp_groups[AC3_MAX_CHANNELS]; ///< Number of exponent groups (nexpgrp)
|
yading@10
|
169 int8_t dexps[AC3_MAX_CHANNELS][AC3_MAX_COEFS]; ///< decoded exponents
|
yading@10
|
170 int exp_strategy[AC3_MAX_BLOCKS][AC3_MAX_CHANNELS]; ///< exponent strategies (expstr)
|
yading@10
|
171 ///@}
|
yading@10
|
172
|
yading@10
|
173 ///@name Bit allocation
///@{
|
yading@10
|
174 AC3BitAllocParameters bit_alloc_params; ///< bit allocation parameters
|
yading@10
|
175 int first_cpl_leak; ///< first coupling leak state (firstcplleak)
|
yading@10
|
176 int snr_offset[AC3_MAX_CHANNELS]; ///< signal-to-noise ratio offsets (snroffst)
|
yading@10
|
177 int fast_gain[AC3_MAX_CHANNELS]; ///< fast gain values/SMR's (fgain)
|
yading@10
|
178 uint8_t bap[AC3_MAX_CHANNELS][AC3_MAX_COEFS]; ///< bit allocation pointers
|
yading@10
|
179 int16_t psd[AC3_MAX_CHANNELS][AC3_MAX_COEFS]; ///< scaled exponents
|
yading@10
|
180 int16_t band_psd[AC3_MAX_CHANNELS][AC3_CRITICAL_BANDS]; ///< interpolated exponents
|
yading@10
|
181 int16_t mask[AC3_MAX_CHANNELS][AC3_CRITICAL_BANDS]; ///< masking curve values
|
yading@10
|
182 int dba_mode[AC3_MAX_CHANNELS]; ///< delta bit allocation mode
|
yading@10
|
183 int dba_nsegs[AC3_MAX_CHANNELS]; ///< number of delta segments
|
yading@10
|
184 uint8_t dba_offsets[AC3_MAX_CHANNELS][8]; ///< delta segment offsets
|
yading@10
|
185 uint8_t dba_lengths[AC3_MAX_CHANNELS][8]; ///< delta segment lengths
|
yading@10
|
186 uint8_t dba_values[AC3_MAX_CHANNELS][8]; ///< delta values for each segment
|
yading@10
|
187 ///@}
|
yading@10
|
188
|
yading@10
|
189 ///@name Zero-mantissa dithering
///@{
|
yading@10
|
190 int dither_flag[AC3_MAX_CHANNELS]; ///< dither flags (dithflg)
|
yading@10
|
191 AVLFG dith_state; ///< for dither generation
|
yading@10
|
192 ///@}
|
yading@10
|
193
|
yading@10
|
194 ///@name IMDCT
///@{
|
yading@10
|
195 int block_switch[AC3_MAX_CHANNELS]; ///< block switch flags (blksw)
|
yading@10
|
196 FFTContext imdct_512; ///< for 512 sample IMDCT
|
yading@10
|
197 FFTContext imdct_256; ///< for 256 sample IMDCT
|
yading@10
|
198 ///@}
|
yading@10
|
199
|
yading@10
|
200 ///@name Optimization
///@{
|
yading@10
|
201 DSPContext dsp; ///< for optimization
|
yading@10
|
202 AVFloatDSPContext fdsp; ///< float DSP context (AVFloatDSPContext)
|
yading@10
|
203 AC3DSPContext ac3dsp; ///< AC-3 DSP context (AC3DSPContext)
|
yading@10
|
204 FmtConvertContext fmt_conv; ///< optimized conversion functions
|
yading@10
|
205 ///@}
|
yading@10
|
206
|
yading@10
|
207 float *outptr[AC3_MAX_CHANNELS]; ///< NOTE(review): presumably per-channel pointers to output samples -- target buffer not shown here; confirm
|
yading@10
|
208 float *xcfptr[AC3_MAX_CHANNELS]; ///< NOTE(review): presumably per-channel pointers to transform coefficients -- confirm
|
yading@10
|
209 float *dlyptr[AC3_MAX_CHANNELS]; ///< NOTE(review): presumably per-channel pointers to delay samples -- confirm
|
yading@10
|
210
|
yading@10
|
211 ///@name Aligned arrays
///@{
|
yading@10
|
212 DECLARE_ALIGNED(16, int, fixed_coeffs)[AC3_MAX_CHANNELS][AC3_MAX_COEFS]; ///< fixed-point transform coefficients
|
yading@10
|
213 DECLARE_ALIGNED(32, float, transform_coeffs)[AC3_MAX_CHANNELS][AC3_MAX_COEFS]; ///< transform coefficients
|
yading@10
|
214 DECLARE_ALIGNED(32, float, delay)[AC3_MAX_CHANNELS][AC3_BLOCK_SIZE]; ///< delay - added to the next block
|
yading@10
|
215 DECLARE_ALIGNED(32, float, window)[AC3_BLOCK_SIZE]; ///< window coefficients
|
yading@10
|
216 DECLARE_ALIGNED(32, float, tmp_output)[AC3_BLOCK_SIZE]; ///< temporary storage for output before windowing
|
yading@10
|
217 DECLARE_ALIGNED(32, float, output)[AC3_MAX_CHANNELS][AC3_BLOCK_SIZE]; ///< output after imdct transform and windowing
|
yading@10
|
218 DECLARE_ALIGNED(32, uint8_t, input_buffer)[AC3_FRAME_BUFFER_SIZE + FF_INPUT_BUFFER_PADDING_SIZE]; ///< temp buffer to prevent overread
|
yading@10
|
219 ///@}
|
yading@10
|
220 } AC3DecodeContext;
|
yading@10
|
221
|
yading@10
|
222 /**
|
yading@10
|
223 * Parse the E-AC-3 frame header.
|
yading@10
|
224 * This parses both the bit stream info and audio frame header.
 *
 * @param s decoder context
 * @return NOTE(review): the return convention is not visible in this header
 *         (presumably 0 on success and a nonzero/negative code on error) --
 *         confirm against the implementation.
|
yading@10
|
225 */
|
yading@10
|
226 int ff_eac3_parse_header(AC3DecodeContext *s);
|
yading@10
|
227
|
yading@10
|
228 /**
|
yading@10
|
229 * Decode mantissas in a single channel for the entire frame.
|
yading@10
|
230 * This is used when AHT mode is enabled.
 *
 * @param s  decoder context
 * @param ch index of the channel whose mantissas are decoded
|
yading@10
|
231 */
|
yading@10
|
232 void ff_eac3_decode_transform_coeffs_aht_ch(AC3DecodeContext *s, int ch);
|
yading@10
|
233
|
yading@10
|
234 /**
|
yading@10
|
235 * Apply spectral extension to each channel by copying lower frequency
|
yading@10
|
236 * coefficients to higher frequency bins and applying side information to
|
yading@10
|
237 * approximate the original high frequency signal.
 *
 * @param s decoder context
|
yading@10
|
238 */
|
yading@10
|
239 void ff_eac3_apply_spectral_extension(AC3DecodeContext *s);
|
yading@10
|
240
|
yading@10
|
241 #endif /* AVCODEC_AC3DEC_H */
|