h264: simplify calls to ff_er_add_slice().
[FFMpeg-mirror/mplayer-patches.git] / libavcodec / ac3dec.c
blob8d9fe5a73c39ab6705b3bc8d83c2d6a4c1e41db0
1 /*
2 * AC-3 Audio Decoder
3 * This code was developed as part of Google Summer of Code 2006.
4 * E-AC-3 support was added as part of Google Summer of Code 2007.
6 * Copyright (c) 2006 Kartikey Mahendra BHATT (bhattkm at gmail dot com)
7 * Copyright (c) 2007-2008 Bartlomiej Wolowiec <bartek.wolowiec@gmail.com>
8 * Copyright (c) 2007 Justin Ruggles <justin.ruggles@gmail.com>
10 * This file is part of Libav.
12 * Libav is free software; you can redistribute it and/or
13 * modify it under the terms of the GNU Lesser General Public
14 * License as published by the Free Software Foundation; either
15 * version 2.1 of the License, or (at your option) any later version.
17 * Libav is distributed in the hope that it will be useful,
18 * but WITHOUT ANY WARRANTY; without even the implied warranty of
19 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
20 * Lesser General Public License for more details.
22 * You should have received a copy of the GNU Lesser General Public
23 * License along with Libav; if not, write to the Free Software
24 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
27 #include <stdio.h>
28 #include <stddef.h>
29 #include <math.h>
30 #include <string.h>
32 #include "libavutil/crc.h"
33 #include "libavutil/opt.h"
34 #include "internal.h"
35 #include "aac_ac3_parser.h"
36 #include "ac3_parser.h"
37 #include "ac3dec.h"
38 #include "ac3dec_data.h"
39 #include "kbdwin.h"
41 /**
42 * table for ungrouping 3 values in 7 bits.
43 * used for exponents and bap=2 mantissas
45 static uint8_t ungroup_3_in_7_bits_tab[128][3];
47 /** tables for ungrouping mantissas */
48 static int b1_mantissas[32][3];
49 static int b2_mantissas[128][3];
50 static int b3_mantissas[8];
51 static int b4_mantissas[128][2];
52 static int b5_mantissas[16];
54 /**
55 * Quantization table: levels for symmetric. bits for asymmetric.
56 * reference: Table 7.18 Mapping of bap to Quantizer
58 static const uint8_t quantization_tab[16] = {
59 0, 3, 5, 7, 11, 15,
60 5, 6, 7, 8, 9, 10, 11, 12, 14, 16
63 /** dynamic range table. converts codes to scale factors. */
64 static float dynamic_range_tab[256];
66 /** Adjustments in dB gain */
67 static const float gain_levels[9] = {
68 LEVEL_PLUS_3DB,
69 LEVEL_PLUS_1POINT5DB,
70 LEVEL_ONE,
71 LEVEL_MINUS_1POINT5DB,
72 LEVEL_MINUS_3DB,
73 LEVEL_MINUS_4POINT5DB,
74 LEVEL_MINUS_6DB,
75 LEVEL_ZERO,
76 LEVEL_MINUS_9DB
79 /**
80 * Table for default stereo downmixing coefficients
81 * reference: Section 7.8.2 Downmixing Into Two Channels
83 static const uint8_t ac3_default_coeffs[8][5][2] = {
84 { { 2, 7 }, { 7, 2 }, },
85 { { 4, 4 }, },
86 { { 2, 7 }, { 7, 2 }, },
87 { { 2, 7 }, { 5, 5 }, { 7, 2 }, },
88 { { 2, 7 }, { 7, 2 }, { 6, 6 }, },
89 { { 2, 7 }, { 5, 5 }, { 7, 2 }, { 8, 8 }, },
90 { { 2, 7 }, { 7, 2 }, { 6, 7 }, { 7, 6 }, },
91 { { 2, 7 }, { 5, 5 }, { 7, 2 }, { 6, 7 }, { 7, 6 }, },
94 /**
95 * Symmetrical Dequantization
96 * reference: Section 7.3.3 Expansion of Mantissas for Symmetrical Quantization
97 * Tables 7.19 to 7.23
99 static inline int
100 symmetric_dequant(int code, int levels)
102 return ((code - (levels >> 1)) << 24) / levels;
106 * Initialize tables at runtime.
108 static av_cold void ac3_tables_init(void)
110 int i;
112 /* generate table for ungrouping 3 values in 7 bits
113 reference: Section 7.1.3 Exponent Decoding */
114 for (i = 0; i < 128; i++) {
115 ungroup_3_in_7_bits_tab[i][0] = i / 25;
116 ungroup_3_in_7_bits_tab[i][1] = (i % 25) / 5;
117 ungroup_3_in_7_bits_tab[i][2] = (i % 25) % 5;
120 /* generate grouped mantissa tables
121 reference: Section 7.3.5 Ungrouping of Mantissas */
122 for (i = 0; i < 32; i++) {
123 /* bap=1 mantissas */
124 b1_mantissas[i][0] = symmetric_dequant(ff_ac3_ungroup_3_in_5_bits_tab[i][0], 3);
125 b1_mantissas[i][1] = symmetric_dequant(ff_ac3_ungroup_3_in_5_bits_tab[i][1], 3);
126 b1_mantissas[i][2] = symmetric_dequant(ff_ac3_ungroup_3_in_5_bits_tab[i][2], 3);
128 for (i = 0; i < 128; i++) {
129 /* bap=2 mantissas */
130 b2_mantissas[i][0] = symmetric_dequant(ungroup_3_in_7_bits_tab[i][0], 5);
131 b2_mantissas[i][1] = symmetric_dequant(ungroup_3_in_7_bits_tab[i][1], 5);
132 b2_mantissas[i][2] = symmetric_dequant(ungroup_3_in_7_bits_tab[i][2], 5);
134 /* bap=4 mantissas */
135 b4_mantissas[i][0] = symmetric_dequant(i / 11, 11);
136 b4_mantissas[i][1] = symmetric_dequant(i % 11, 11);
138 /* generate ungrouped mantissa tables
139 reference: Tables 7.21 and 7.23 */
140 for (i = 0; i < 7; i++) {
141 /* bap=3 mantissas */
142 b3_mantissas[i] = symmetric_dequant(i, 7);
144 for (i = 0; i < 15; i++) {
145 /* bap=5 mantissas */
146 b5_mantissas[i] = symmetric_dequant(i, 15);
149 /* generate dynamic range table
150 reference: Section 7.7.1 Dynamic Range Control */
151 for (i = 0; i < 256; i++) {
152 int v = (i >> 5) - ((i >> 7) << 3) - 5;
153 dynamic_range_tab[i] = powf(2.0f, v) * ((i & 0x1F) | 0x20);
158 * AVCodec initialization
160 static av_cold int ac3_decode_init(AVCodecContext *avctx)
162 AC3DecodeContext *s = avctx->priv_data;
163 int i;
165 s->avctx = avctx;
167 ff_ac3_common_init();
168 ac3_tables_init();
169 ff_mdct_init(&s->imdct_256, 8, 1, 1.0);
170 ff_mdct_init(&s->imdct_512, 9, 1, 1.0);
171 ff_kbd_window_init(s->window, 5.0, 256);
172 ff_dsputil_init(&s->dsp, avctx);
173 avpriv_float_dsp_init(&s->fdsp, avctx->flags & CODEC_FLAG_BITEXACT);
174 ff_ac3dsp_init(&s->ac3dsp, avctx->flags & CODEC_FLAG_BITEXACT);
175 ff_fmt_convert_init(&s->fmt_conv, avctx);
176 av_lfg_init(&s->dith_state, 0);
178 avctx->sample_fmt = AV_SAMPLE_FMT_FLTP;
180 /* allow downmixing to stereo or mono */
181 if (avctx->channels > 0 && avctx->request_channels > 0 &&
182 avctx->request_channels < avctx->channels &&
183 avctx->request_channels <= 2) {
184 avctx->channels = avctx->request_channels;
186 s->downmixed = 1;
188 for (i = 0; i < AC3_MAX_CHANNELS; i++) {
189 s->xcfptr[i] = s->transform_coeffs[i];
190 s->dlyptr[i] = s->delay[i];
193 return 0;
197 * Parse the 'sync info' and 'bit stream info' from the AC-3 bitstream.
198 * GetBitContext within AC3DecodeContext must point to
199 * the start of the synchronized AC-3 bitstream.
201 static int ac3_parse_header(AC3DecodeContext *s)
203 GetBitContext *gbc = &s->gbc;
204 int i;
206 /* read the rest of the bsi. read twice for dual mono mode. */
207 i = !s->channel_mode;
208 do {
209 skip_bits(gbc, 5); // skip dialog normalization
210 if (get_bits1(gbc))
211 skip_bits(gbc, 8); //skip compression
212 if (get_bits1(gbc))
213 skip_bits(gbc, 8); //skip language code
214 if (get_bits1(gbc))
215 skip_bits(gbc, 7); //skip audio production information
216 } while (i--);
218 skip_bits(gbc, 2); //skip copyright bit and original bitstream bit
220 /* skip the timecodes (or extra bitstream information for Alternate Syntax)
221 TODO: read & use the xbsi1 downmix levels */
222 if (get_bits1(gbc))
223 skip_bits(gbc, 14); //skip timecode1 / xbsi1
224 if (get_bits1(gbc))
225 skip_bits(gbc, 14); //skip timecode2 / xbsi2
227 /* skip additional bitstream info */
228 if (get_bits1(gbc)) {
229 i = get_bits(gbc, 6);
230 do {
231 skip_bits(gbc, 8);
232 } while (i--);
235 return 0;
239 * Common function to parse AC-3 or E-AC-3 frame header
241 static int parse_frame_header(AC3DecodeContext *s)
243 AC3HeaderInfo hdr;
244 int err;
246 err = avpriv_ac3_parse_header(&s->gbc, &hdr);
247 if (err)
248 return err;
250 /* get decoding parameters from header info */
251 s->bit_alloc_params.sr_code = hdr.sr_code;
252 s->bitstream_mode = hdr.bitstream_mode;
253 s->channel_mode = hdr.channel_mode;
254 s->channel_layout = hdr.channel_layout;
255 s->lfe_on = hdr.lfe_on;
256 s->bit_alloc_params.sr_shift = hdr.sr_shift;
257 s->sample_rate = hdr.sample_rate;
258 s->bit_rate = hdr.bit_rate;
259 s->channels = hdr.channels;
260 s->fbw_channels = s->channels - s->lfe_on;
261 s->lfe_ch = s->fbw_channels + 1;
262 s->frame_size = hdr.frame_size;
263 s->center_mix_level = hdr.center_mix_level;
264 s->surround_mix_level = hdr.surround_mix_level;
265 s->num_blocks = hdr.num_blocks;
266 s->frame_type = hdr.frame_type;
267 s->substreamid = hdr.substreamid;
269 if (s->lfe_on) {
270 s->start_freq[s->lfe_ch] = 0;
271 s->end_freq[s->lfe_ch] = 7;
272 s->num_exp_groups[s->lfe_ch] = 2;
273 s->channel_in_cpl[s->lfe_ch] = 0;
276 if (hdr.bitstream_id <= 10) {
277 s->eac3 = 0;
278 s->snr_offset_strategy = 2;
279 s->block_switch_syntax = 1;
280 s->dither_flag_syntax = 1;
281 s->bit_allocation_syntax = 1;
282 s->fast_gain_syntax = 0;
283 s->first_cpl_leak = 0;
284 s->dba_syntax = 1;
285 s->skip_syntax = 1;
286 memset(s->channel_uses_aht, 0, sizeof(s->channel_uses_aht));
287 return ac3_parse_header(s);
288 } else if (CONFIG_EAC3_DECODER) {
289 s->eac3 = 1;
290 return ff_eac3_parse_header(s);
291 } else {
292 av_log(s->avctx, AV_LOG_ERROR, "E-AC-3 support not compiled in\n");
293 return -1;
298 * Set stereo downmixing coefficients based on frame header info.
299 * reference: Section 7.8.2 Downmixing Into Two Channels
301 static void set_downmix_coeffs(AC3DecodeContext *s)
303 int i;
304 float cmix = gain_levels[s-> center_mix_level];
305 float smix = gain_levels[s->surround_mix_level];
306 float norm0, norm1;
308 for (i = 0; i < s->fbw_channels; i++) {
309 s->downmix_coeffs[i][0] = gain_levels[ac3_default_coeffs[s->channel_mode][i][0]];
310 s->downmix_coeffs[i][1] = gain_levels[ac3_default_coeffs[s->channel_mode][i][1]];
312 if (s->channel_mode > 1 && s->channel_mode & 1) {
313 s->downmix_coeffs[1][0] = s->downmix_coeffs[1][1] = cmix;
315 if (s->channel_mode == AC3_CHMODE_2F1R || s->channel_mode == AC3_CHMODE_3F1R) {
316 int nf = s->channel_mode - 2;
317 s->downmix_coeffs[nf][0] = s->downmix_coeffs[nf][1] = smix * LEVEL_MINUS_3DB;
319 if (s->channel_mode == AC3_CHMODE_2F2R || s->channel_mode == AC3_CHMODE_3F2R) {
320 int nf = s->channel_mode - 4;
321 s->downmix_coeffs[nf][0] = s->downmix_coeffs[nf+1][1] = smix;
324 /* renormalize */
325 norm0 = norm1 = 0.0;
326 for (i = 0; i < s->fbw_channels; i++) {
327 norm0 += s->downmix_coeffs[i][0];
328 norm1 += s->downmix_coeffs[i][1];
330 norm0 = 1.0f / norm0;
331 norm1 = 1.0f / norm1;
332 for (i = 0; i < s->fbw_channels; i++) {
333 s->downmix_coeffs[i][0] *= norm0;
334 s->downmix_coeffs[i][1] *= norm1;
337 if (s->output_mode == AC3_CHMODE_MONO) {
338 for (i = 0; i < s->fbw_channels; i++)
339 s->downmix_coeffs[i][0] = (s->downmix_coeffs[i][0] +
340 s->downmix_coeffs[i][1]) * LEVEL_MINUS_3DB;
345 * Decode the grouped exponents according to exponent strategy.
346 * reference: Section 7.1.3 Exponent Decoding
348 static int decode_exponents(GetBitContext *gbc, int exp_strategy, int ngrps,
349 uint8_t absexp, int8_t *dexps)
351 int i, j, grp, group_size;
352 int dexp[256];
353 int expacc, prevexp;
355 /* unpack groups */
356 group_size = exp_strategy + (exp_strategy == EXP_D45);
357 for (grp = 0, i = 0; grp < ngrps; grp++) {
358 expacc = get_bits(gbc, 7);
359 dexp[i++] = ungroup_3_in_7_bits_tab[expacc][0];
360 dexp[i++] = ungroup_3_in_7_bits_tab[expacc][1];
361 dexp[i++] = ungroup_3_in_7_bits_tab[expacc][2];
364 /* convert to absolute exps and expand groups */
365 prevexp = absexp;
366 for (i = 0, j = 0; i < ngrps * 3; i++) {
367 prevexp += dexp[i] - 2;
368 if (prevexp > 24U)
369 return -1;
370 switch (group_size) {
371 case 4: dexps[j++] = prevexp;
372 dexps[j++] = prevexp;
373 case 2: dexps[j++] = prevexp;
374 case 1: dexps[j++] = prevexp;
377 return 0;
381 * Generate transform coefficients for each coupled channel in the coupling
382 * range using the coupling coefficients and coupling coordinates.
383 * reference: Section 7.4.3 Coupling Coordinate Format
385 static void calc_transform_coeffs_cpl(AC3DecodeContext *s)
387 int bin, band, ch;
389 bin = s->start_freq[CPL_CH];
390 for (band = 0; band < s->num_cpl_bands; band++) {
391 int band_start = bin;
392 int band_end = bin + s->cpl_band_sizes[band];
393 for (ch = 1; ch <= s->fbw_channels; ch++) {
394 if (s->channel_in_cpl[ch]) {
395 int cpl_coord = s->cpl_coords[ch][band] << 5;
396 for (bin = band_start; bin < band_end; bin++) {
397 s->fixed_coeffs[ch][bin] =
398 MULH(s->fixed_coeffs[CPL_CH][bin] << 4, cpl_coord);
400 if (ch == 2 && s->phase_flags[band]) {
401 for (bin = band_start; bin < band_end; bin++)
402 s->fixed_coeffs[2][bin] = -s->fixed_coeffs[2][bin];
406 bin = band_end;
411 * Grouped mantissas for 3-level 5-level and 11-level quantization
413 typedef struct {
414 int b1_mant[2];
415 int b2_mant[2];
416 int b4_mant;
417 int b1;
418 int b2;
419 int b4;
420 } mant_groups;
423 * Decode the transform coefficients for a particular channel
424 * reference: Section 7.3 Quantization and Decoding of Mantissas
426 static void ac3_decode_transform_coeffs_ch(AC3DecodeContext *s, int ch_index, mant_groups *m)
428 int start_freq = s->start_freq[ch_index];
429 int end_freq = s->end_freq[ch_index];
430 uint8_t *baps = s->bap[ch_index];
431 int8_t *exps = s->dexps[ch_index];
432 int *coeffs = s->fixed_coeffs[ch_index];
433 int dither = (ch_index == CPL_CH) || s->dither_flag[ch_index];
434 GetBitContext *gbc = &s->gbc;
435 int freq;
437 for (freq = start_freq; freq < end_freq; freq++) {
438 int bap = baps[freq];
439 int mantissa;
440 switch (bap) {
441 case 0:
442 /* random noise with approximate range of -0.707 to 0.707 */
443 if (dither)
444 mantissa = (av_lfg_get(&s->dith_state) / 362) - 5932275;
445 else
446 mantissa = 0;
447 break;
448 case 1:
449 if (m->b1) {
450 m->b1--;
451 mantissa = m->b1_mant[m->b1];
452 } else {
453 int bits = get_bits(gbc, 5);
454 mantissa = b1_mantissas[bits][0];
455 m->b1_mant[1] = b1_mantissas[bits][1];
456 m->b1_mant[0] = b1_mantissas[bits][2];
457 m->b1 = 2;
459 break;
460 case 2:
461 if (m->b2) {
462 m->b2--;
463 mantissa = m->b2_mant[m->b2];
464 } else {
465 int bits = get_bits(gbc, 7);
466 mantissa = b2_mantissas[bits][0];
467 m->b2_mant[1] = b2_mantissas[bits][1];
468 m->b2_mant[0] = b2_mantissas[bits][2];
469 m->b2 = 2;
471 break;
472 case 3:
473 mantissa = b3_mantissas[get_bits(gbc, 3)];
474 break;
475 case 4:
476 if (m->b4) {
477 m->b4 = 0;
478 mantissa = m->b4_mant;
479 } else {
480 int bits = get_bits(gbc, 7);
481 mantissa = b4_mantissas[bits][0];
482 m->b4_mant = b4_mantissas[bits][1];
483 m->b4 = 1;
485 break;
486 case 5:
487 mantissa = b5_mantissas[get_bits(gbc, 4)];
488 break;
489 default: /* 6 to 15 */
490 /* Shift mantissa and sign-extend it. */
491 mantissa = get_sbits(gbc, quantization_tab[bap]);
492 mantissa <<= 24 - quantization_tab[bap];
493 break;
495 coeffs[freq] = mantissa >> exps[freq];
500 * Remove random dithering from coupling range coefficients with zero-bit
501 * mantissas for coupled channels which do not use dithering.
502 * reference: Section 7.3.4 Dither for Zero Bit Mantissas (bap=0)
504 static void remove_dithering(AC3DecodeContext *s) {
505 int ch, i;
507 for (ch = 1; ch <= s->fbw_channels; ch++) {
508 if (!s->dither_flag[ch] && s->channel_in_cpl[ch]) {
509 for (i = s->start_freq[CPL_CH]; i < s->end_freq[CPL_CH]; i++) {
510 if (!s->bap[CPL_CH][i])
511 s->fixed_coeffs[ch][i] = 0;
517 static void decode_transform_coeffs_ch(AC3DecodeContext *s, int blk, int ch,
518 mant_groups *m)
520 if (!s->channel_uses_aht[ch]) {
521 ac3_decode_transform_coeffs_ch(s, ch, m);
522 } else {
523 /* if AHT is used, mantissas for all blocks are encoded in the first
524 block of the frame. */
525 int bin;
526 if (!blk && CONFIG_EAC3_DECODER)
527 ff_eac3_decode_transform_coeffs_aht_ch(s, ch);
528 for (bin = s->start_freq[ch]; bin < s->end_freq[ch]; bin++) {
529 s->fixed_coeffs[ch][bin] = s->pre_mantissa[ch][bin][blk] >> s->dexps[ch][bin];
535 * Decode the transform coefficients.
537 static void decode_transform_coeffs(AC3DecodeContext *s, int blk)
539 int ch, end;
540 int got_cplchan = 0;
541 mant_groups m;
543 m.b1 = m.b2 = m.b4 = 0;
545 for (ch = 1; ch <= s->channels; ch++) {
546 /* transform coefficients for full-bandwidth channel */
547 decode_transform_coeffs_ch(s, blk, ch, &m);
548 /* transform coefficients for coupling channel come right after the
549 coefficients for the first coupled channel*/
550 if (s->channel_in_cpl[ch]) {
551 if (!got_cplchan) {
552 decode_transform_coeffs_ch(s, blk, CPL_CH, &m);
553 calc_transform_coeffs_cpl(s);
554 got_cplchan = 1;
556 end = s->end_freq[CPL_CH];
557 } else {
558 end = s->end_freq[ch];
561 s->fixed_coeffs[ch][end] = 0;
562 while (++end < 256);
565 /* zero the dithered coefficients for appropriate channels */
566 remove_dithering(s);
570 * Stereo rematrixing.
571 * reference: Section 7.5.4 Rematrixing : Decoding Technique
573 static void do_rematrixing(AC3DecodeContext *s)
575 int bnd, i;
576 int end, bndend;
578 end = FFMIN(s->end_freq[1], s->end_freq[2]);
580 for (bnd = 0; bnd < s->num_rematrixing_bands; bnd++) {
581 if (s->rematrixing_flags[bnd]) {
582 bndend = FFMIN(end, ff_ac3_rematrix_band_tab[bnd + 1]);
583 for (i = ff_ac3_rematrix_band_tab[bnd]; i < bndend; i++) {
584 int tmp0 = s->fixed_coeffs[1][i];
585 s->fixed_coeffs[1][i] += s->fixed_coeffs[2][i];
586 s->fixed_coeffs[2][i] = tmp0 - s->fixed_coeffs[2][i];
593 * Inverse MDCT Transform.
594 * Convert frequency domain coefficients to time-domain audio samples.
595 * reference: Section 7.9.4 Transformation Equations
597 static inline void do_imdct(AC3DecodeContext *s, int channels)
599 int ch;
601 for (ch = 1; ch <= channels; ch++) {
602 if (s->block_switch[ch]) {
603 int i;
604 float *x = s->tmp_output + 128;
605 for (i = 0; i < 128; i++)
606 x[i] = s->transform_coeffs[ch][2 * i];
607 s->imdct_256.imdct_half(&s->imdct_256, s->tmp_output, x);
608 s->fdsp.vector_fmul_window(s->outptr[ch - 1], s->delay[ch - 1],
609 s->tmp_output, s->window, 128);
610 for (i = 0; i < 128; i++)
611 x[i] = s->transform_coeffs[ch][2 * i + 1];
612 s->imdct_256.imdct_half(&s->imdct_256, s->delay[ch - 1], x);
613 } else {
614 s->imdct_512.imdct_half(&s->imdct_512, s->tmp_output, s->transform_coeffs[ch]);
615 s->fdsp.vector_fmul_window(s->outptr[ch - 1], s->delay[ch - 1],
616 s->tmp_output, s->window, 128);
617 memcpy(s->delay[ch - 1], s->tmp_output + 128, 128 * sizeof(float));
623 * Upmix delay samples from stereo to original channel layout.
625 static void ac3_upmix_delay(AC3DecodeContext *s)
627 int channel_data_size = sizeof(s->delay[0]);
628 switch (s->channel_mode) {
629 case AC3_CHMODE_DUALMONO:
630 case AC3_CHMODE_STEREO:
631 /* upmix mono to stereo */
632 memcpy(s->delay[1], s->delay[0], channel_data_size);
633 break;
634 case AC3_CHMODE_2F2R:
635 memset(s->delay[3], 0, channel_data_size);
636 case AC3_CHMODE_2F1R:
637 memset(s->delay[2], 0, channel_data_size);
638 break;
639 case AC3_CHMODE_3F2R:
640 memset(s->delay[4], 0, channel_data_size);
641 case AC3_CHMODE_3F1R:
642 memset(s->delay[3], 0, channel_data_size);
643 case AC3_CHMODE_3F:
644 memcpy(s->delay[2], s->delay[1], channel_data_size);
645 memset(s->delay[1], 0, channel_data_size);
646 break;
651 * Decode band structure for coupling, spectral extension, or enhanced coupling.
652 * The band structure defines how many subbands are in each band. For each
653 * subband in the range, 1 means it is combined with the previous band, and 0
654 * means that it starts a new band.
656 * @param[in] gbc bit reader context
657 * @param[in] blk block number
658 * @param[in] eac3 flag to indicate E-AC-3
659 * @param[in] ecpl flag to indicate enhanced coupling
660 * @param[in] start_subband subband number for start of range
661 * @param[in] end_subband subband number for end of range
662 * @param[in] default_band_struct default band structure table
663 * @param[out] num_bands number of bands (optionally NULL)
664 * @param[out] band_sizes array containing the number of bins in each band (optionally NULL)
666 static void decode_band_structure(GetBitContext *gbc, int blk, int eac3,
667 int ecpl, int start_subband, int end_subband,
668 const uint8_t *default_band_struct,
669 int *num_bands, uint8_t *band_sizes)
671 int subbnd, bnd, n_subbands, n_bands=0;
672 uint8_t bnd_sz[22];
673 uint8_t coded_band_struct[22];
674 const uint8_t *band_struct;
676 n_subbands = end_subband - start_subband;
678 /* decode band structure from bitstream or use default */
679 if (!eac3 || get_bits1(gbc)) {
680 for (subbnd = 0; subbnd < n_subbands - 1; subbnd++) {
681 coded_band_struct[subbnd] = get_bits1(gbc);
683 band_struct = coded_band_struct;
684 } else if (!blk) {
685 band_struct = &default_band_struct[start_subband+1];
686 } else {
687 /* no change in band structure */
688 return;
691 /* calculate number of bands and band sizes based on band structure.
692 note that the first 4 subbands in enhanced coupling span only 6 bins
693 instead of 12. */
694 if (num_bands || band_sizes ) {
695 n_bands = n_subbands;
696 bnd_sz[0] = ecpl ? 6 : 12;
697 for (bnd = 0, subbnd = 1; subbnd < n_subbands; subbnd++) {
698 int subbnd_size = (ecpl && subbnd < 4) ? 6 : 12;
699 if (band_struct[subbnd - 1]) {
700 n_bands--;
701 bnd_sz[bnd] += subbnd_size;
702 } else {
703 bnd_sz[++bnd] = subbnd_size;
708 /* set optional output params */
709 if (num_bands)
710 *num_bands = n_bands;
711 if (band_sizes)
712 memcpy(band_sizes, bnd_sz, n_bands);
716 * Decode a single audio block from the AC-3 bitstream.
718 static int decode_audio_block(AC3DecodeContext *s, int blk)
720 int fbw_channels = s->fbw_channels;
721 int channel_mode = s->channel_mode;
722 int i, bnd, seg, ch;
723 int different_transforms;
724 int downmix_output;
725 int cpl_in_use;
726 GetBitContext *gbc = &s->gbc;
727 uint8_t bit_alloc_stages[AC3_MAX_CHANNELS] = { 0 };
729 /* block switch flags */
730 different_transforms = 0;
731 if (s->block_switch_syntax) {
732 for (ch = 1; ch <= fbw_channels; ch++) {
733 s->block_switch[ch] = get_bits1(gbc);
734 if (ch > 1 && s->block_switch[ch] != s->block_switch[1])
735 different_transforms = 1;
739 /* dithering flags */
740 if (s->dither_flag_syntax) {
741 for (ch = 1; ch <= fbw_channels; ch++) {
742 s->dither_flag[ch] = get_bits1(gbc);
746 /* dynamic range */
747 i = !s->channel_mode;
748 do {
749 if (get_bits1(gbc)) {
750 s->dynamic_range[i] = ((dynamic_range_tab[get_bits(gbc, 8)] - 1.0) *
751 s->drc_scale) + 1.0;
752 } else if (blk == 0) {
753 s->dynamic_range[i] = 1.0f;
755 } while (i--);
757 /* spectral extension strategy */
758 if (s->eac3 && (!blk || get_bits1(gbc))) {
759 s->spx_in_use = get_bits1(gbc);
760 if (s->spx_in_use) {
761 int dst_start_freq, dst_end_freq, src_start_freq,
762 start_subband, end_subband;
764 /* determine which channels use spx */
765 if (s->channel_mode == AC3_CHMODE_MONO) {
766 s->channel_uses_spx[1] = 1;
767 } else {
768 for (ch = 1; ch <= fbw_channels; ch++)
769 s->channel_uses_spx[ch] = get_bits1(gbc);
772 /* get the frequency bins of the spx copy region and the spx start
773 and end subbands */
774 dst_start_freq = get_bits(gbc, 2);
775 start_subband = get_bits(gbc, 3) + 2;
776 if (start_subband > 7)
777 start_subband += start_subband - 7;
778 end_subband = get_bits(gbc, 3) + 5;
779 if (end_subband > 7)
780 end_subband += end_subband - 7;
781 dst_start_freq = dst_start_freq * 12 + 25;
782 src_start_freq = start_subband * 12 + 25;
783 dst_end_freq = end_subband * 12 + 25;
785 /* check validity of spx ranges */
786 if (start_subband >= end_subband) {
787 av_log(s->avctx, AV_LOG_ERROR, "invalid spectral extension "
788 "range (%d >= %d)\n", start_subband, end_subband);
789 return -1;
791 if (dst_start_freq >= src_start_freq) {
792 av_log(s->avctx, AV_LOG_ERROR, "invalid spectral extension "
793 "copy start bin (%d >= %d)\n", dst_start_freq, src_start_freq);
794 return -1;
797 s->spx_dst_start_freq = dst_start_freq;
798 s->spx_src_start_freq = src_start_freq;
799 s->spx_dst_end_freq = dst_end_freq;
801 decode_band_structure(gbc, blk, s->eac3, 0,
802 start_subband, end_subband,
803 ff_eac3_default_spx_band_struct,
804 &s->num_spx_bands,
805 s->spx_band_sizes);
806 } else {
807 for (ch = 1; ch <= fbw_channels; ch++) {
808 s->channel_uses_spx[ch] = 0;
809 s->first_spx_coords[ch] = 1;
814 /* spectral extension coordinates */
815 if (s->spx_in_use) {
816 for (ch = 1; ch <= fbw_channels; ch++) {
817 if (s->channel_uses_spx[ch]) {
818 if (s->first_spx_coords[ch] || get_bits1(gbc)) {
819 float spx_blend;
820 int bin, master_spx_coord;
822 s->first_spx_coords[ch] = 0;
823 spx_blend = get_bits(gbc, 5) * (1.0f/32);
824 master_spx_coord = get_bits(gbc, 2) * 3;
826 bin = s->spx_src_start_freq;
827 for (bnd = 0; bnd < s->num_spx_bands; bnd++) {
828 int bandsize;
829 int spx_coord_exp, spx_coord_mant;
830 float nratio, sblend, nblend, spx_coord;
832 /* calculate blending factors */
833 bandsize = s->spx_band_sizes[bnd];
834 nratio = ((float)((bin + (bandsize >> 1))) / s->spx_dst_end_freq) - spx_blend;
835 nratio = av_clipf(nratio, 0.0f, 1.0f);
836 nblend = sqrtf(3.0f * nratio); // noise is scaled by sqrt(3)
837 // to give unity variance
838 sblend = sqrtf(1.0f - nratio);
839 bin += bandsize;
841 /* decode spx coordinates */
842 spx_coord_exp = get_bits(gbc, 4);
843 spx_coord_mant = get_bits(gbc, 2);
844 if (spx_coord_exp == 15) spx_coord_mant <<= 1;
845 else spx_coord_mant += 4;
846 spx_coord_mant <<= (25 - spx_coord_exp - master_spx_coord);
847 spx_coord = spx_coord_mant * (1.0f / (1 << 23));
849 /* multiply noise and signal blending factors by spx coordinate */
850 s->spx_noise_blend [ch][bnd] = nblend * spx_coord;
851 s->spx_signal_blend[ch][bnd] = sblend * spx_coord;
854 } else {
855 s->first_spx_coords[ch] = 1;
860 /* coupling strategy */
861 if (s->eac3 ? s->cpl_strategy_exists[blk] : get_bits1(gbc)) {
862 memset(bit_alloc_stages, 3, AC3_MAX_CHANNELS);
863 if (!s->eac3)
864 s->cpl_in_use[blk] = get_bits1(gbc);
865 if (s->cpl_in_use[blk]) {
866 /* coupling in use */
867 int cpl_start_subband, cpl_end_subband;
869 if (channel_mode < AC3_CHMODE_STEREO) {
870 av_log(s->avctx, AV_LOG_ERROR, "coupling not allowed in mono or dual-mono\n");
871 return -1;
874 /* check for enhanced coupling */
875 if (s->eac3 && get_bits1(gbc)) {
876 /* TODO: parse enhanced coupling strategy info */
877 av_log_missing_feature(s->avctx, "Enhanced coupling", 1);
878 return AVERROR_PATCHWELCOME;
881 /* determine which channels are coupled */
882 if (s->eac3 && s->channel_mode == AC3_CHMODE_STEREO) {
883 s->channel_in_cpl[1] = 1;
884 s->channel_in_cpl[2] = 1;
885 } else {
886 for (ch = 1; ch <= fbw_channels; ch++)
887 s->channel_in_cpl[ch] = get_bits1(gbc);
890 /* phase flags in use */
891 if (channel_mode == AC3_CHMODE_STEREO)
892 s->phase_flags_in_use = get_bits1(gbc);
894 /* coupling frequency range */
895 cpl_start_subband = get_bits(gbc, 4);
896 cpl_end_subband = s->spx_in_use ? (s->spx_src_start_freq - 37) / 12 :
897 get_bits(gbc, 4) + 3;
898 if (cpl_start_subband >= cpl_end_subband) {
899 av_log(s->avctx, AV_LOG_ERROR, "invalid coupling range (%d >= %d)\n",
900 cpl_start_subband, cpl_end_subband);
901 return -1;
903 s->start_freq[CPL_CH] = cpl_start_subband * 12 + 37;
904 s->end_freq[CPL_CH] = cpl_end_subband * 12 + 37;
906 decode_band_structure(gbc, blk, s->eac3, 0, cpl_start_subband,
907 cpl_end_subband,
908 ff_eac3_default_cpl_band_struct,
909 &s->num_cpl_bands, s->cpl_band_sizes);
910 } else {
911 /* coupling not in use */
912 for (ch = 1; ch <= fbw_channels; ch++) {
913 s->channel_in_cpl[ch] = 0;
914 s->first_cpl_coords[ch] = 1;
916 s->first_cpl_leak = s->eac3;
917 s->phase_flags_in_use = 0;
919 } else if (!s->eac3) {
920 if (!blk) {
921 av_log(s->avctx, AV_LOG_ERROR, "new coupling strategy must "
922 "be present in block 0\n");
923 return -1;
924 } else {
925 s->cpl_in_use[blk] = s->cpl_in_use[blk-1];
928 cpl_in_use = s->cpl_in_use[blk];
930 /* coupling coordinates */
931 if (cpl_in_use) {
932 int cpl_coords_exist = 0;
934 for (ch = 1; ch <= fbw_channels; ch++) {
935 if (s->channel_in_cpl[ch]) {
936 if ((s->eac3 && s->first_cpl_coords[ch]) || get_bits1(gbc)) {
937 int master_cpl_coord, cpl_coord_exp, cpl_coord_mant;
938 s->first_cpl_coords[ch] = 0;
939 cpl_coords_exist = 1;
940 master_cpl_coord = 3 * get_bits(gbc, 2);
941 for (bnd = 0; bnd < s->num_cpl_bands; bnd++) {
942 cpl_coord_exp = get_bits(gbc, 4);
943 cpl_coord_mant = get_bits(gbc, 4);
944 if (cpl_coord_exp == 15)
945 s->cpl_coords[ch][bnd] = cpl_coord_mant << 22;
946 else
947 s->cpl_coords[ch][bnd] = (cpl_coord_mant + 16) << 21;
948 s->cpl_coords[ch][bnd] >>= (cpl_coord_exp + master_cpl_coord);
950 } else if (!blk) {
951 av_log(s->avctx, AV_LOG_ERROR, "new coupling coordinates must "
952 "be present in block 0\n");
953 return -1;
955 } else {
956 /* channel not in coupling */
957 s->first_cpl_coords[ch] = 1;
960 /* phase flags */
961 if (channel_mode == AC3_CHMODE_STEREO && cpl_coords_exist) {
962 for (bnd = 0; bnd < s->num_cpl_bands; bnd++) {
963 s->phase_flags[bnd] = s->phase_flags_in_use? get_bits1(gbc) : 0;
968 /* stereo rematrixing strategy and band structure */
969 if (channel_mode == AC3_CHMODE_STEREO) {
970 if ((s->eac3 && !blk) || get_bits1(gbc)) {
971 s->num_rematrixing_bands = 4;
972 if (cpl_in_use && s->start_freq[CPL_CH] <= 61) {
973 s->num_rematrixing_bands -= 1 + (s->start_freq[CPL_CH] == 37);
974 } else if (s->spx_in_use && s->spx_src_start_freq <= 61) {
975 s->num_rematrixing_bands--;
977 for (bnd = 0; bnd < s->num_rematrixing_bands; bnd++)
978 s->rematrixing_flags[bnd] = get_bits1(gbc);
979 } else if (!blk) {
980 av_log(s->avctx, AV_LOG_WARNING, "Warning: "
981 "new rematrixing strategy not present in block 0\n");
982 s->num_rematrixing_bands = 0;
986 /* exponent strategies for each channel */
987 for (ch = !cpl_in_use; ch <= s->channels; ch++) {
988 if (!s->eac3)
989 s->exp_strategy[blk][ch] = get_bits(gbc, 2 - (ch == s->lfe_ch));
990 if (s->exp_strategy[blk][ch] != EXP_REUSE)
991 bit_alloc_stages[ch] = 3;
994 /* channel bandwidth */
995 for (ch = 1; ch <= fbw_channels; ch++) {
996 s->start_freq[ch] = 0;
997 if (s->exp_strategy[blk][ch] != EXP_REUSE) {
998 int group_size;
999 int prev = s->end_freq[ch];
1000 if (s->channel_in_cpl[ch])
1001 s->end_freq[ch] = s->start_freq[CPL_CH];
1002 else if (s->channel_uses_spx[ch])
1003 s->end_freq[ch] = s->spx_src_start_freq;
1004 else {
1005 int bandwidth_code = get_bits(gbc, 6);
1006 if (bandwidth_code > 60) {
1007 av_log(s->avctx, AV_LOG_ERROR, "bandwidth code = %d > 60\n", bandwidth_code);
1008 return -1;
1010 s->end_freq[ch] = bandwidth_code * 3 + 73;
1012 group_size = 3 << (s->exp_strategy[blk][ch] - 1);
1013 s->num_exp_groups[ch] = (s->end_freq[ch] + group_size-4) / group_size;
1014 if (blk > 0 && s->end_freq[ch] != prev)
1015 memset(bit_alloc_stages, 3, AC3_MAX_CHANNELS);
1018 if (cpl_in_use && s->exp_strategy[blk][CPL_CH] != EXP_REUSE) {
1019 s->num_exp_groups[CPL_CH] = (s->end_freq[CPL_CH] - s->start_freq[CPL_CH]) /
1020 (3 << (s->exp_strategy[blk][CPL_CH] - 1));
1023 /* decode exponents for each channel */
1024 for (ch = !cpl_in_use; ch <= s->channels; ch++) {
1025 if (s->exp_strategy[blk][ch] != EXP_REUSE) {
1026 s->dexps[ch][0] = get_bits(gbc, 4) << !ch;
1027 if (decode_exponents(gbc, s->exp_strategy[blk][ch],
1028 s->num_exp_groups[ch], s->dexps[ch][0],
1029 &s->dexps[ch][s->start_freq[ch]+!!ch])) {
1030 av_log(s->avctx, AV_LOG_ERROR, "exponent out-of-range\n");
1031 return -1;
1033 if (ch != CPL_CH && ch != s->lfe_ch)
1034 skip_bits(gbc, 2); /* skip gainrng */
1038 /* bit allocation information */
1039 if (s->bit_allocation_syntax) {
1040 if (get_bits1(gbc)) {
1041 s->bit_alloc_params.slow_decay = ff_ac3_slow_decay_tab[get_bits(gbc, 2)] >> s->bit_alloc_params.sr_shift;
1042 s->bit_alloc_params.fast_decay = ff_ac3_fast_decay_tab[get_bits(gbc, 2)] >> s->bit_alloc_params.sr_shift;
1043 s->bit_alloc_params.slow_gain = ff_ac3_slow_gain_tab[get_bits(gbc, 2)];
1044 s->bit_alloc_params.db_per_bit = ff_ac3_db_per_bit_tab[get_bits(gbc, 2)];
1045 s->bit_alloc_params.floor = ff_ac3_floor_tab[get_bits(gbc, 3)];
1046 for (ch = !cpl_in_use; ch <= s->channels; ch++)
1047 bit_alloc_stages[ch] = FFMAX(bit_alloc_stages[ch], 2);
1048 } else if (!blk) {
1049 av_log(s->avctx, AV_LOG_ERROR, "new bit allocation info must "
1050 "be present in block 0\n");
1051 return -1;
1055 /* signal-to-noise ratio offsets and fast gains (signal-to-mask ratios) */
1056 if (!s->eac3 || !blk) {
1057 if (s->snr_offset_strategy && get_bits1(gbc)) {
1058 int snr = 0;
1059 int csnr;
1060 csnr = (get_bits(gbc, 6) - 15) << 4;
1061 for (i = ch = !cpl_in_use; ch <= s->channels; ch++) {
1062 /* snr offset */
1063 if (ch == i || s->snr_offset_strategy == 2)
1064 snr = (csnr + get_bits(gbc, 4)) << 2;
1065 /* run at least last bit allocation stage if snr offset changes */
1066 if (blk && s->snr_offset[ch] != snr) {
1067 bit_alloc_stages[ch] = FFMAX(bit_alloc_stages[ch], 1);
1069 s->snr_offset[ch] = snr;
1071 /* fast gain (normal AC-3 only) */
1072 if (!s->eac3) {
1073 int prev = s->fast_gain[ch];
1074 s->fast_gain[ch] = ff_ac3_fast_gain_tab[get_bits(gbc, 3)];
1075 /* run last 2 bit allocation stages if fast gain changes */
1076 if (blk && prev != s->fast_gain[ch])
1077 bit_alloc_stages[ch] = FFMAX(bit_alloc_stages[ch], 2);
1080 } else if (!s->eac3 && !blk) {
1081 av_log(s->avctx, AV_LOG_ERROR, "new snr offsets must be present in block 0\n");
1082 return -1;
1086 /* fast gain (E-AC-3 only) */
1087 if (s->fast_gain_syntax && get_bits1(gbc)) {
1088 for (ch = !cpl_in_use; ch <= s->channels; ch++) {
1089 int prev = s->fast_gain[ch];
1090 s->fast_gain[ch] = ff_ac3_fast_gain_tab[get_bits(gbc, 3)];
1091 /* run last 2 bit allocation stages if fast gain changes */
1092 if (blk && prev != s->fast_gain[ch])
1093 bit_alloc_stages[ch] = FFMAX(bit_alloc_stages[ch], 2);
1095 } else if (s->eac3 && !blk) {
1096 for (ch = !cpl_in_use; ch <= s->channels; ch++)
1097 s->fast_gain[ch] = ff_ac3_fast_gain_tab[4];
1100 /* E-AC-3 to AC-3 converter SNR offset */
1101 if (s->frame_type == EAC3_FRAME_TYPE_INDEPENDENT && get_bits1(gbc)) {
1102 skip_bits(gbc, 10); // skip converter snr offset
1105 /* coupling leak information */
1106 if (cpl_in_use) {
1107 if (s->first_cpl_leak || get_bits1(gbc)) {
1108 int fl = get_bits(gbc, 3);
1109 int sl = get_bits(gbc, 3);
1110 /* run last 2 bit allocation stages for coupling channel if
1111 coupling leak changes */
1112 if (blk && (fl != s->bit_alloc_params.cpl_fast_leak ||
1113 sl != s->bit_alloc_params.cpl_slow_leak)) {
1114 bit_alloc_stages[CPL_CH] = FFMAX(bit_alloc_stages[CPL_CH], 2);
1116 s->bit_alloc_params.cpl_fast_leak = fl;
1117 s->bit_alloc_params.cpl_slow_leak = sl;
1118 } else if (!s->eac3 && !blk) {
1119 av_log(s->avctx, AV_LOG_ERROR, "new coupling leak info must "
1120 "be present in block 0\n");
1121 return -1;
1123 s->first_cpl_leak = 0;
1126 /* delta bit allocation information */
1127 if (s->dba_syntax && get_bits1(gbc)) {
1128 /* delta bit allocation exists (strategy) */
1129 for (ch = !cpl_in_use; ch <= fbw_channels; ch++) {
1130 s->dba_mode[ch] = get_bits(gbc, 2);
1131 if (s->dba_mode[ch] == DBA_RESERVED) {
1132 av_log(s->avctx, AV_LOG_ERROR, "delta bit allocation strategy reserved\n");
1133 return -1;
1135 bit_alloc_stages[ch] = FFMAX(bit_alloc_stages[ch], 2);
1137 /* channel delta offset, len and bit allocation */
1138 for (ch = !cpl_in_use; ch <= fbw_channels; ch++) {
1139 if (s->dba_mode[ch] == DBA_NEW) {
1140 s->dba_nsegs[ch] = get_bits(gbc, 3) + 1;
1141 for (seg = 0; seg < s->dba_nsegs[ch]; seg++) {
1142 s->dba_offsets[ch][seg] = get_bits(gbc, 5);
1143 s->dba_lengths[ch][seg] = get_bits(gbc, 4);
1144 s->dba_values[ch][seg] = get_bits(gbc, 3);
1146 /* run last 2 bit allocation stages if new dba values */
1147 bit_alloc_stages[ch] = FFMAX(bit_alloc_stages[ch], 2);
1150 } else if (blk == 0) {
1151 for (ch = 0; ch <= s->channels; ch++) {
1152 s->dba_mode[ch] = DBA_NONE;
1156 /* Bit allocation */
1157 for (ch = !cpl_in_use; ch <= s->channels; ch++) {
1158 if (bit_alloc_stages[ch] > 2) {
1159 /* Exponent mapping into PSD and PSD integration */
1160 ff_ac3_bit_alloc_calc_psd(s->dexps[ch],
1161 s->start_freq[ch], s->end_freq[ch],
1162 s->psd[ch], s->band_psd[ch]);
1164 if (bit_alloc_stages[ch] > 1) {
1165 /* Compute excitation function, Compute masking curve, and
1166 Apply delta bit allocation */
1167 if (ff_ac3_bit_alloc_calc_mask(&s->bit_alloc_params, s->band_psd[ch],
1168 s->start_freq[ch], s->end_freq[ch],
1169 s->fast_gain[ch], (ch == s->lfe_ch),
1170 s->dba_mode[ch], s->dba_nsegs[ch],
1171 s->dba_offsets[ch], s->dba_lengths[ch],
1172 s->dba_values[ch], s->mask[ch])) {
1173 av_log(s->avctx, AV_LOG_ERROR, "error in bit allocation\n");
1174 return -1;
1177 if (bit_alloc_stages[ch] > 0) {
1178 /* Compute bit allocation */
1179 const uint8_t *bap_tab = s->channel_uses_aht[ch] ?
1180 ff_eac3_hebap_tab : ff_ac3_bap_tab;
1181 s->ac3dsp.bit_alloc_calc_bap(s->mask[ch], s->psd[ch],
1182 s->start_freq[ch], s->end_freq[ch],
1183 s->snr_offset[ch],
1184 s->bit_alloc_params.floor,
1185 bap_tab, s->bap[ch]);
1189 /* unused dummy data */
1190 if (s->skip_syntax && get_bits1(gbc)) {
1191 int skipl = get_bits(gbc, 9);
1192 while (skipl--)
1193 skip_bits(gbc, 8);
1196 /* unpack the transform coefficients
1197 this also uncouples channels if coupling is in use. */
1198 decode_transform_coeffs(s, blk);
1200 /* TODO: generate enhanced coupling coordinates and uncouple */
1202 /* recover coefficients if rematrixing is in use */
1203 if (s->channel_mode == AC3_CHMODE_STEREO)
1204 do_rematrixing(s);
1206 /* apply scaling to coefficients (headroom, dynrng) */
1207 for (ch = 1; ch <= s->channels; ch++) {
1208 float gain = 1.0 / 4194304.0f;
1209 if (s->channel_mode == AC3_CHMODE_DUALMONO) {
1210 gain *= s->dynamic_range[2 - ch];
1211 } else {
1212 gain *= s->dynamic_range[0];
1214 s->fmt_conv.int32_to_float_fmul_scalar(s->transform_coeffs[ch],
1215 s->fixed_coeffs[ch], gain, 256);
1218 /* apply spectral extension to high frequency bins */
1219 if (s->spx_in_use && CONFIG_EAC3_DECODER) {
1220 ff_eac3_apply_spectral_extension(s);
1223 /* downmix and MDCT. order depends on whether block switching is used for
1224 any channel in this block. this is because coefficients for the long
1225 and short transforms cannot be mixed. */
1226 downmix_output = s->channels != s->out_channels &&
1227 !((s->output_mode & AC3_OUTPUT_LFEON) &&
1228 s->fbw_channels == s->out_channels);
1229 if (different_transforms) {
1230 /* the delay samples have already been downmixed, so we upmix the delay
1231 samples in order to reconstruct all channels before downmixing. */
1232 if (s->downmixed) {
1233 s->downmixed = 0;
1234 ac3_upmix_delay(s);
1237 do_imdct(s, s->channels);
1239 if (downmix_output) {
1240 s->ac3dsp.downmix(s->outptr, s->downmix_coeffs,
1241 s->out_channels, s->fbw_channels, 256);
1243 } else {
1244 if (downmix_output) {
1245 s->ac3dsp.downmix(s->xcfptr + 1, s->downmix_coeffs,
1246 s->out_channels, s->fbw_channels, 256);
1249 if (downmix_output && !s->downmixed) {
1250 s->downmixed = 1;
1251 s->ac3dsp.downmix(s->dlyptr, s->downmix_coeffs, s->out_channels,
1252 s->fbw_channels, 128);
1255 do_imdct(s, s->out_channels);
1258 return 0;
1262 * Decode a single AC-3 frame.
1264 static int ac3_decode_frame(AVCodecContext * avctx, void *data,
1265 int *got_frame_ptr, AVPacket *avpkt)
1267 AVFrame *frame = data;
1268 const uint8_t *buf = avpkt->data;
1269 int buf_size = avpkt->size;
1270 AC3DecodeContext *s = avctx->priv_data;
1271 int blk, ch, err, ret;
1272 const uint8_t *channel_map;
1273 const float *output[AC3_MAX_CHANNELS];
1275 /* copy input buffer to decoder context to avoid reading past the end
1276 of the buffer, which can be caused by a damaged input stream. */
1277 if (buf_size >= 2 && AV_RB16(buf) == 0x770B) {
1278 // seems to be byte-swapped AC-3
1279 int cnt = FFMIN(buf_size, AC3_FRAME_BUFFER_SIZE) >> 1;
1280 s->dsp.bswap16_buf((uint16_t *)s->input_buffer, (const uint16_t *)buf, cnt);
1281 } else
1282 memcpy(s->input_buffer, buf, FFMIN(buf_size, AC3_FRAME_BUFFER_SIZE));
1283 buf = s->input_buffer;
1284 /* initialize the GetBitContext with the start of valid AC-3 Frame */
1285 init_get_bits(&s->gbc, buf, buf_size * 8);
1287 /* parse the syncinfo */
1288 err = parse_frame_header(s);
1290 if (err) {
1291 switch (err) {
1292 case AAC_AC3_PARSE_ERROR_SYNC:
1293 av_log(avctx, AV_LOG_ERROR, "frame sync error\n");
1294 return -1;
1295 case AAC_AC3_PARSE_ERROR_BSID:
1296 av_log(avctx, AV_LOG_ERROR, "invalid bitstream id\n");
1297 break;
1298 case AAC_AC3_PARSE_ERROR_SAMPLE_RATE:
1299 av_log(avctx, AV_LOG_ERROR, "invalid sample rate\n");
1300 break;
1301 case AAC_AC3_PARSE_ERROR_FRAME_SIZE:
1302 av_log(avctx, AV_LOG_ERROR, "invalid frame size\n");
1303 break;
1304 case AAC_AC3_PARSE_ERROR_FRAME_TYPE:
1305 /* skip frame if CRC is ok. otherwise use error concealment. */
1306 /* TODO: add support for substreams and dependent frames */
1307 if (s->frame_type == EAC3_FRAME_TYPE_DEPENDENT || s->substreamid) {
1308 av_log(avctx, AV_LOG_ERROR, "unsupported frame type : "
1309 "skipping frame\n");
1310 *got_frame_ptr = 0;
1311 return s->frame_size;
1312 } else {
1313 av_log(avctx, AV_LOG_ERROR, "invalid frame type\n");
1315 break;
1316 default:
1317 av_log(avctx, AV_LOG_ERROR, "invalid header\n");
1318 break;
1320 } else {
1321 /* check that reported frame size fits in input buffer */
1322 if (s->frame_size > buf_size) {
1323 av_log(avctx, AV_LOG_ERROR, "incomplete frame\n");
1324 err = AAC_AC3_PARSE_ERROR_FRAME_SIZE;
1325 } else if (avctx->err_recognition & AV_EF_CRCCHECK) {
1326 /* check for crc mismatch */
1327 if (av_crc(av_crc_get_table(AV_CRC_16_ANSI), 0, &buf[2],
1328 s->frame_size - 2)) {
1329 av_log(avctx, AV_LOG_ERROR, "frame CRC mismatch\n");
1330 err = AAC_AC3_PARSE_ERROR_CRC;
1335 /* if frame is ok, set audio parameters */
1336 if (!err) {
1337 avctx->sample_rate = s->sample_rate;
1338 avctx->bit_rate = s->bit_rate;
1340 /* channel config */
1341 s->out_channels = s->channels;
1342 s->output_mode = s->channel_mode;
1343 if (s->lfe_on)
1344 s->output_mode |= AC3_OUTPUT_LFEON;
1345 if (avctx->request_channels > 0 && avctx->request_channels <= 2 &&
1346 avctx->request_channels < s->channels) {
1347 s->out_channels = avctx->request_channels;
1348 s->output_mode = avctx->request_channels == 1 ? AC3_CHMODE_MONO : AC3_CHMODE_STEREO;
1349 s->channel_layout = avpriv_ac3_channel_layout_tab[s->output_mode];
1351 avctx->channels = s->out_channels;
1352 avctx->channel_layout = s->channel_layout;
1354 /* set downmixing coefficients if needed */
1355 if (s->channels != s->out_channels && !((s->output_mode & AC3_OUTPUT_LFEON) &&
1356 s->fbw_channels == s->out_channels)) {
1357 set_downmix_coeffs(s);
1359 } else if (!s->out_channels) {
1360 s->out_channels = avctx->channels;
1361 if (s->out_channels < s->channels)
1362 s->output_mode = s->out_channels == 1 ? AC3_CHMODE_MONO : AC3_CHMODE_STEREO;
1364 /* set audio service type based on bitstream mode for AC-3 */
1365 avctx->audio_service_type = s->bitstream_mode;
1366 if (s->bitstream_mode == 0x7 && s->channels > 1)
1367 avctx->audio_service_type = AV_AUDIO_SERVICE_TYPE_KARAOKE;
1369 /* get output buffer */
1370 avctx->channels = s->out_channels;
1371 frame->nb_samples = s->num_blocks * 256;
1372 if ((ret = ff_get_buffer(avctx, frame)) < 0) {
1373 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n");
1374 return ret;
1377 /* decode the audio blocks */
1378 channel_map = ff_ac3_dec_channel_map[s->output_mode & ~AC3_OUTPUT_LFEON][s->lfe_on];
1379 for (ch = 0; ch < s->channels; ch++) {
1380 if (ch < s->out_channels)
1381 s->outptr[channel_map[ch]] = (float *)frame->data[ch];
1382 else
1383 s->outptr[ch] = s->output[ch];
1384 output[ch] = s->output[ch];
1386 for (blk = 0; blk < s->num_blocks; blk++) {
1387 if (!err && decode_audio_block(s, blk)) {
1388 av_log(avctx, AV_LOG_ERROR, "error decoding the audio block\n");
1389 err = 1;
1391 if (err)
1392 for (ch = 0; ch < s->out_channels; ch++)
1393 memcpy(s->outptr[channel_map[ch]], output[ch], 1024);
1394 for (ch = 0; ch < s->out_channels; ch++) {
1395 output[ch] = s->outptr[channel_map[ch]];
1396 s->outptr[channel_map[ch]] += AC3_BLOCK_SIZE;
1400 /* keep last block for error concealment in next frame */
1401 for (ch = 0; ch < s->out_channels; ch++)
1402 memcpy(s->output[ch], output[ch], 1024);
1404 *got_frame_ptr = 1;
1406 return FFMIN(buf_size, s->frame_size);
1410 * Uninitialize the AC-3 decoder.
1412 static av_cold int ac3_decode_end(AVCodecContext *avctx)
1414 AC3DecodeContext *s = avctx->priv_data;
1415 ff_mdct_end(&s->imdct_512);
1416 ff_mdct_end(&s->imdct_256);
1418 return 0;
1421 #define OFFSET(x) offsetof(AC3DecodeContext, x)
1422 #define PAR (AV_OPT_FLAG_DECODING_PARAM | AV_OPT_FLAG_AUDIO_PARAM)
1423 static const AVOption options[] = {
1424 { "drc_scale", "percentage of dynamic range compression to apply", OFFSET(drc_scale), AV_OPT_TYPE_FLOAT, {.dbl = 1.0}, 0.0, 1.0, PAR },
1425 { NULL},
1428 static const AVClass ac3_decoder_class = {
1429 .class_name = "AC3 decoder",
1430 .item_name = av_default_item_name,
1431 .option = options,
1432 .version = LIBAVUTIL_VERSION_INT,
1435 AVCodec ff_ac3_decoder = {
1436 .name = "ac3",
1437 .type = AVMEDIA_TYPE_AUDIO,
1438 .id = AV_CODEC_ID_AC3,
1439 .priv_data_size = sizeof (AC3DecodeContext),
1440 .init = ac3_decode_init,
1441 .close = ac3_decode_end,
1442 .decode = ac3_decode_frame,
1443 .capabilities = CODEC_CAP_DR1,
1444 .long_name = NULL_IF_CONFIG_SMALL("ATSC A/52A (AC-3)"),
1445 .sample_fmts = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLTP,
1446 AV_SAMPLE_FMT_NONE },
1447 .priv_class = &ac3_decoder_class,
1450 #if CONFIG_EAC3_DECODER
1451 static const AVClass eac3_decoder_class = {
1452 .class_name = "E-AC3 decoder",
1453 .item_name = av_default_item_name,
1454 .option = options,
1455 .version = LIBAVUTIL_VERSION_INT,
1458 AVCodec ff_eac3_decoder = {
1459 .name = "eac3",
1460 .type = AVMEDIA_TYPE_AUDIO,
1461 .id = AV_CODEC_ID_EAC3,
1462 .priv_data_size = sizeof (AC3DecodeContext),
1463 .init = ac3_decode_init,
1464 .close = ac3_decode_end,
1465 .decode = ac3_decode_frame,
1466 .capabilities = CODEC_CAP_DR1,
1467 .long_name = NULL_IF_CONFIG_SMALL("ATSC A/52B (AC-3, E-AC-3)"),
1468 .sample_fmts = (const enum AVSampleFormat[]) { AV_SAMPLE_FMT_FLTP,
1469 AV_SAMPLE_FMT_NONE },
1470 .priv_class = &eac3_decoder_class,
1472 #endif