blob: f8f0eb45f64360cd8692faa814fb069bde0cd080 [file] [log] [blame]
/*
 * AAC encoder
 * Copyright (C) 2008 Konstantin Shishkov
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
21
/**
 * @file
 * AAC encoder
 */
26
/***********************************
 *              TODOs:
 * add sane pulse detection
 * add temporal noise shaping
 ***********************************/
32
33#include "avcodec.h"
Alex Converse78e65cd2009-07-08 20:01:3134#include "put_bits.h"
Kostya Shishkovc03d9d02008-08-14 05:52:2935#include "dsputil.h"
36#include "mpeg4audio.h"
37
Kostya Shishkovc03d9d02008-08-14 05:52:2938#include "aac.h"
39#include "aactab.h"
Alex Converse78e65cd2009-07-08 20:01:3140#include "aacenc.h"
41
42#include "psymodel.h"
Kostya Shishkovc03d9d02008-08-14 05:52:2943
/** Largest channel count accepted by aac_encode_init(). */
#define AAC_MAX_CHANNELS 6

/*
 * Scalefactor band widths, in spectral coefficients, used for frames that
 * are coded as a single 1024-coefficient window. Every table sums to 1024.
 * The numeric suffix appears to be the nominal sample rate in kHz
 * (NOTE(review): inferred from the names and from the index table below).
 */
static const uint8_t swb_size_1024_96[] = {
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 8, 8, 8, 8, 8,
    12, 12, 12, 12, 12, 16, 16, 24, 28, 36, 44,
    64, 64, 64, 64, 64, 64, 64, 64, 64, 64, 64
};

static const uint8_t swb_size_1024_64[] = {
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 8, 8, 8, 8,
    12, 12, 12, 16, 16, 16, 20, 24, 24, 28, 36,
    40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40, 40
};

static const uint8_t swb_size_1024_48[] = {
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 8, 8, 8, 8, 8, 8, 8,
    12, 12, 12, 12, 16, 16, 20, 20, 24, 24, 28, 28,
    32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32,
    96
};

static const uint8_t swb_size_1024_32[] = {
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 8, 8, 8, 8, 8, 8, 8,
    12, 12, 12, 12, 16, 16, 20, 20, 24, 24, 28, 28,
    32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32, 32
};

static const uint8_t swb_size_1024_24[] = {
    4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 4, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    12, 12, 12, 12, 16, 16, 16, 20, 20, 24, 24, 28, 28,
    32, 36, 36, 40, 44, 48, 52, 52, 64, 64, 64, 64, 64
};

static const uint8_t swb_size_1024_16[] = {
    8, 8, 8, 8, 8, 8, 8, 8, 8, 8, 8,
    12, 12, 12, 12, 12, 12, 12, 12, 12, 16, 16, 16, 16, 20, 20, 20, 24, 24, 28, 28,
    32, 36, 40, 40, 44, 48, 52, 56, 60, 64, 64, 64
};

static const uint8_t swb_size_1024_8[] = {
    12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12,
    16, 16, 16, 16, 16, 16, 16, 20, 20, 20, 20, 24, 24, 24, 28, 28,
    32, 36, 36, 40, 44, 48, 52, 56, 60, 64, 80
};

/**
 * Band-width table to use for each sample-rate index (12 entries).
 * aac_encode_init() indexes this with the position of the sample rate in
 * ff_mpeg4audio_sample_rates, so only indices 0..11 are valid.
 */
static const uint8_t * const swb_size_1024[] = {
    swb_size_1024_96, swb_size_1024_96, swb_size_1024_64,
    swb_size_1024_48, swb_size_1024_48, swb_size_1024_32,
    swb_size_1024_24, swb_size_1024_24, swb_size_1024_16,
    swb_size_1024_16, swb_size_1024_16, swb_size_1024_8
};
95
/*
 * Scalefactor band widths, in spectral coefficients, used for each of the
 * eight 128-coefficient windows of a short-window frame. Every table sums
 * to 128. The numeric suffix appears to be the nominal sample rate in kHz
 * (NOTE(review): inferred from the names and from the index table below).
 */
static const uint8_t swb_size_128_96[] = {
    4, 4, 4, 4, 4, 4, 8, 8, 8, 16, 28, 36
};

static const uint8_t swb_size_128_48[] = {
    4, 4, 4, 4, 4, 8, 8, 8, 12, 12, 12, 16, 16, 16
};

static const uint8_t swb_size_128_24[] = {
    4, 4, 4, 4, 4, 4, 4, 8, 8, 8, 12, 12, 16, 16, 20
};

static const uint8_t swb_size_128_16[] = {
    4, 4, 4, 4, 4, 4, 4, 4, 8, 8, 12, 12, 16, 20, 20
};

static const uint8_t swb_size_128_8[] = {
    4, 4, 4, 4, 4, 4, 4, 8, 8, 8, 8, 12, 16, 20, 20
};

/**
 * Band-width table to use for each sample-rate index (12 entries).
 * aac_encode_init() indexes this with the position of the sample rate in
 * ff_mpeg4audio_sample_rates, so only indices 0..11 are valid.
 */
static const uint8_t * const swb_size_128[] = {
    /* the last entry on the following row is swb_size_128_64 but is a
       duplicate of swb_size_128_96 */
    swb_size_128_96, swb_size_128_96, swb_size_128_96,
    swb_size_128_48, swb_size_128_48, swb_size_128_48,
    swb_size_128_24, swb_size_128_24, swb_size_128_16,
    swb_size_128_16, swb_size_128_16, swb_size_128_8
};
124
Kostya Shishkovc03d9d02008-08-14 05:52:29125/** default channel configurations */
126static const uint8_t aac_chan_configs[6][5] = {
Kostya Shishkovf5c3eae2008-08-16 11:59:36127 {1, TYPE_SCE}, // 1 channel - single channel element
128 {1, TYPE_CPE}, // 2 channels - channel pair
129 {2, TYPE_SCE, TYPE_CPE}, // 3 channels - center + stereo
130 {3, TYPE_SCE, TYPE_CPE, TYPE_SCE}, // 4 channels - front center + stereo + back center
131 {3, TYPE_SCE, TYPE_CPE, TYPE_CPE}, // 5 channels - front center + stereo + back stereo
132 {4, TYPE_SCE, TYPE_CPE, TYPE_CPE, TYPE_LFE}, // 6 channels - front center + stereo + back stereo + LFE
Kostya Shishkovc03d9d02008-08-14 05:52:29133};
134
135/**
Kostya Shishkovc03d9d02008-08-14 05:52:29136 * Make AAC audio config object.
137 * @see 1.6.2.1 "Syntax - AudioSpecificConfig"
138 */
139static void put_audio_specific_config(AVCodecContext *avctx)
140{
141 PutBitContext pb;
142 AACEncContext *s = avctx->priv_data;
143
144 init_put_bits(&pb, avctx->extradata, avctx->extradata_size*8);
145 put_bits(&pb, 5, 2); //object type - AAC-LC
146 put_bits(&pb, 4, s->samplerate_index); //sample rate index
147 put_bits(&pb, 4, avctx->channels);
148 //GASpecificConfig
149 put_bits(&pb, 1, 0); //frame length - 1024 samples
150 put_bits(&pb, 1, 0); //does not depend on core coder
151 put_bits(&pb, 1, 0); //is not extension
Alex Conversed67a6aa2011-01-22 05:23:43152
153 //Explicitly Mark SBR absent
154 put_bits(&pb, 11, 0x27b); //sync extension
155 put_bits(&pb, 5, AOT_SBR);
156 put_bits(&pb, 1, 0);
Kostya Shishkovc03d9d02008-08-14 05:52:29157 flush_put_bits(&pb);
158}
159
160static av_cold int aac_encode_init(AVCodecContext *avctx)
161{
162 AACEncContext *s = avctx->priv_data;
163 int i;
Alex Converse78e65cd2009-07-08 20:01:31164 const uint8_t *sizes[2];
165 int lengths[2];
Kostya Shishkovc03d9d02008-08-14 05:52:29166
167 avctx->frame_size = 1024;
168
Alex Conversefd257dc2009-07-08 20:36:45169 for (i = 0; i < 16; i++)
170 if (avctx->sample_rate == ff_mpeg4audio_sample_rates[i])
Kostya Shishkovc03d9d02008-08-14 05:52:29171 break;
Alex Conversefd257dc2009-07-08 20:36:45172 if (i == 16) {
Kostya Shishkovc03d9d02008-08-14 05:52:29173 av_log(avctx, AV_LOG_ERROR, "Unsupported sample rate %d\n", avctx->sample_rate);
174 return -1;
175 }
Måns Rullgård86e41bc32010-07-06 00:06:15176 if (avctx->channels > AAC_MAX_CHANNELS) {
Kostya Shishkovc03d9d02008-08-14 05:52:29177 av_log(avctx, AV_LOG_ERROR, "Unsupported number of channels: %d\n", avctx->channels);
178 return -1;
179 }
Alex Converse52342922010-04-02 16:26:10180 if (avctx->profile != FF_PROFILE_UNKNOWN && avctx->profile != FF_PROFILE_AAC_LOW) {
181 av_log(avctx, AV_LOG_ERROR, "Unsupported profile %d\n", avctx->profile);
182 return -1;
183 }
Alex Converse217b44d2010-05-06 20:35:10184 if (1024.0 * avctx->bit_rate / avctx->sample_rate > 6144 * avctx->channels) {
185 av_log(avctx, AV_LOG_ERROR, "Too many bits per frame requested\n");
186 return -1;
187 }
Kostya Shishkovc03d9d02008-08-14 05:52:29188 s->samplerate_index = i;
Kostya Shishkovc03d9d02008-08-14 05:52:29189
190 dsputil_init(&s->dsp, avctx);
Siarhei Siamashka7d485f12009-05-16 14:17:08191 ff_mdct_init(&s->mdct1024, 11, 0, 1.0);
192 ff_mdct_init(&s->mdct128, 8, 0, 1.0);
Kostya Shishkov817015e2008-08-16 05:47:18193 // window init
194 ff_kbd_window_init(ff_aac_kbd_long_1024, 4.0, 1024);
195 ff_kbd_window_init(ff_aac_kbd_short_128, 6.0, 128);
Reimar Döffinger14b86072010-01-09 13:28:04196 ff_init_ff_sine_windows(10);
197 ff_init_ff_sine_windows(7);
Kostya Shishkovc03d9d02008-08-14 05:52:29198
Diego Biurrun99d61d32009-07-08 21:16:06199 s->samples = av_malloc(2 * 1024 * avctx->channels * sizeof(s->samples[0]));
200 s->cpe = av_mallocz(sizeof(ChannelElement) * aac_chan_configs[avctx->channels-1][0]);
Alex Conversed67a6aa2011-01-22 05:23:43201 avctx->extradata = av_mallocz(5 + FF_INPUT_BUFFER_PADDING_SIZE);
202 avctx->extradata_size = 5;
Kostya Shishkovc03d9d02008-08-14 05:52:29203 put_audio_specific_config(avctx);
Alex Converse78e65cd2009-07-08 20:01:31204
Diego Biurrun99d61d32009-07-08 21:16:06205 sizes[0] = swb_size_1024[i];
206 sizes[1] = swb_size_128[i];
Alex Converse78e65cd2009-07-08 20:01:31207 lengths[0] = ff_aac_num_swb_1024[i];
208 lengths[1] = ff_aac_num_swb_128[i];
209 ff_psy_init(&s->psy, avctx, 2, sizes, lengths);
210 s->psypp = ff_psy_preprocess_init(avctx);
Alex Converse960323a2010-05-14 16:49:21211 s->coder = &ff_aac_coders[2];
Alex Converse78e65cd2009-07-08 20:01:31212
213 s->lambda = avctx->global_quality ? avctx->global_quality : 120;
Alex Conversee29af812010-06-23 19:30:01214
215 ff_aac_tableinit();
Alex Converse78e65cd2009-07-08 20:01:31216
Kostya Shishkovc03d9d02008-08-14 05:52:29217 return 0;
218}
219
Alex Converse78e65cd2009-07-08 20:01:31220static void apply_window_and_mdct(AVCodecContext *avctx, AACEncContext *s,
Nathan Caldwell00454992010-07-19 18:19:53221 SingleChannelElement *sce, short *audio)
Alex Converse78e65cd2009-07-08 20:01:31222{
Nathan Caldwell00454992010-07-19 18:19:53223 int i, k;
224 const int chans = avctx->channels;
Alex Converse78e65cd2009-07-08 20:01:31225 const float * lwindow = sce->ics.use_kb_window[0] ? ff_aac_kbd_long_1024 : ff_sine_1024;
226 const float * swindow = sce->ics.use_kb_window[0] ? ff_aac_kbd_short_128 : ff_sine_128;
227 const float * pwindow = sce->ics.use_kb_window[1] ? ff_aac_kbd_short_128 : ff_sine_128;
228
229 if (sce->ics.window_sequence[0] != EIGHT_SHORT_SEQUENCE) {
230 memcpy(s->output, sce->saved, sizeof(float)*1024);
Alex Conversefd257dc2009-07-08 20:36:45231 if (sce->ics.window_sequence[0] == LONG_STOP_SEQUENCE) {
Alex Converse78e65cd2009-07-08 20:01:31232 memset(s->output, 0, sizeof(s->output[0]) * 448);
Alex Conversefd257dc2009-07-08 20:36:45233 for (i = 448; i < 576; i++)
Alex Converse78e65cd2009-07-08 20:01:31234 s->output[i] = sce->saved[i] * pwindow[i - 448];
Alex Conversefd257dc2009-07-08 20:36:45235 for (i = 576; i < 704; i++)
Alex Converse78e65cd2009-07-08 20:01:31236 s->output[i] = sce->saved[i];
237 }
Alex Conversefd257dc2009-07-08 20:36:45238 if (sce->ics.window_sequence[0] != LONG_START_SEQUENCE) {
Nathan Caldwell00454992010-07-19 18:19:53239 for (i = 0; i < 1024; i++) {
240 s->output[i+1024] = audio[i * chans] * lwindow[1024 - i - 1];
241 sce->saved[i] = audio[i * chans] * lwindow[i];
Alex Converse78e65cd2009-07-08 20:01:31242 }
Alex Conversefd257dc2009-07-08 20:36:45243 } else {
Nathan Caldwell00454992010-07-19 18:19:53244 for (i = 0; i < 448; i++)
245 s->output[i+1024] = audio[i * chans];
246 for (; i < 576; i++)
247 s->output[i+1024] = audio[i * chans] * swindow[576 - i - 1];
Alex Converse78e65cd2009-07-08 20:01:31248 memset(s->output+1024+576, 0, sizeof(s->output[0]) * 448);
Nathan Caldwell00454992010-07-19 18:19:53249 for (i = 0; i < 1024; i++)
250 sce->saved[i] = audio[i * chans];
Alex Converse78e65cd2009-07-08 20:01:31251 }
252 ff_mdct_calc(&s->mdct1024, sce->coeffs, s->output);
Alex Conversefd257dc2009-07-08 20:36:45253 } else {
Alex Converse78e65cd2009-07-08 20:01:31254 for (k = 0; k < 1024; k += 128) {
Alex Conversefd257dc2009-07-08 20:36:45255 for (i = 448 + k; i < 448 + k + 256; i++)
Alex Converse78e65cd2009-07-08 20:01:31256 s->output[i - 448 - k] = (i < 1024)
257 ? sce->saved[i]
Nathan Caldwell00454992010-07-19 18:19:53258 : audio[(i-1024)*chans];
Alex Converse78e65cd2009-07-08 20:01:31259 s->dsp.vector_fmul (s->output, k ? swindow : pwindow, 128);
260 s->dsp.vector_fmul_reverse(s->output+128, s->output+128, swindow, 128);
261 ff_mdct_calc(&s->mdct128, sce->coeffs + k, s->output);
262 }
Nathan Caldwell00454992010-07-19 18:19:53263 for (i = 0; i < 1024; i++)
264 sce->saved[i] = audio[i * chans];
Alex Converse78e65cd2009-07-08 20:01:31265 }
266}
267
Kostya Shishkovc03d9d02008-08-14 05:52:29268/**
269 * Encode ics_info element.
270 * @see Table 4.6 (syntax of ics_info)
271 */
Kostya Shishkove43b0a72008-08-24 05:56:23272static void put_ics_info(AACEncContext *s, IndividualChannelStream *info)
Kostya Shishkovc03d9d02008-08-14 05:52:29273{
Alex Converse78e65cd2009-07-08 20:01:31274 int w;
Kostya Shishkovc03d9d02008-08-14 05:52:29275
276 put_bits(&s->pb, 1, 0); // ics_reserved bit
277 put_bits(&s->pb, 2, info->window_sequence[0]);
278 put_bits(&s->pb, 1, info->use_kb_window[0]);
Alex Conversefd257dc2009-07-08 20:36:45279 if (info->window_sequence[0] != EIGHT_SHORT_SEQUENCE) {
Kostya Shishkovc03d9d02008-08-14 05:52:29280 put_bits(&s->pb, 6, info->max_sfb);
281 put_bits(&s->pb, 1, 0); // no prediction
Alex Conversefd257dc2009-07-08 20:36:45282 } else {
Kostya Shishkovc03d9d02008-08-14 05:52:29283 put_bits(&s->pb, 4, info->max_sfb);
Diego Biurrunc8f47d82009-07-08 21:36:33284 for (w = 1; w < 8; w++)
Alex Converse78e65cd2009-07-08 20:01:31285 put_bits(&s->pb, 1, !info->group_len[w]);
Kostya Shishkovc03d9d02008-08-14 05:52:29286 }
287}
288
289/**
Alex Converse78e65cd2009-07-08 20:01:31290 * Encode MS data.
291 * @see 4.6.8.1 "Joint Coding - M/S Stereo"
Kostya Shishkove43b0a72008-08-24 05:56:23292 */
Alex Converse78e65cd2009-07-08 20:01:31293static void encode_ms_info(PutBitContext *pb, ChannelElement *cpe)
Kostya Shishkove43b0a72008-08-24 05:56:23294{
Kostya Shishkove43b0a72008-08-24 05:56:23295 int i, w;
Alex Converse78e65cd2009-07-08 20:01:31296
297 put_bits(pb, 2, cpe->ms_mode);
Diego Biurrunc8f47d82009-07-08 21:36:33298 if (cpe->ms_mode == 1)
299 for (w = 0; w < cpe->ch[0].ics.num_windows; w += cpe->ch[0].ics.group_len[w])
Alex Conversefd257dc2009-07-08 20:36:45300 for (i = 0; i < cpe->ch[0].ics.max_sfb; i++)
Alex Converse78e65cd2009-07-08 20:01:31301 put_bits(pb, 1, cpe->ms_mask[w*16 + i]);
Alex Converse78e65cd2009-07-08 20:01:31302}
303
304/**
305 * Produce integer coefficients from scalefactors provided by the model.
306 */
307static void adjust_frame_information(AACEncContext *apc, ChannelElement *cpe, int chans)
308{
309 int i, w, w2, g, ch;
Alex Converse99d7a3e2010-08-31 00:33:56310 int start, maxsfb, cmaxsfb;
Alex Converse78e65cd2009-07-08 20:01:31311
Alex Conversefd257dc2009-07-08 20:36:45312 for (ch = 0; ch < chans; ch++) {
Alex Converse78e65cd2009-07-08 20:01:31313 IndividualChannelStream *ics = &cpe->ch[ch].ics;
314 start = 0;
315 maxsfb = 0;
316 cpe->ch[ch].pulse.num_pulse = 0;
Alex Conversefd257dc2009-07-08 20:36:45317 for (w = 0; w < ics->num_windows*16; w += 16) {
318 for (g = 0; g < ics->num_swb; g++) {
Alex Converse78e65cd2009-07-08 20:01:31319 //apply M/S
Alex Converse76dfe4e2010-08-30 23:43:03320 if (cpe->common_window && !ch && cpe->ms_mask[w + g]) {
Alex Conversefd257dc2009-07-08 20:36:45321 for (i = 0; i < ics->swb_sizes[g]; i++) {
Alex Converse78e65cd2009-07-08 20:01:31322 cpe->ch[0].coeffs[start+i] = (cpe->ch[0].coeffs[start+i] + cpe->ch[1].coeffs[start+i]) / 2.0;
323 cpe->ch[1].coeffs[start+i] = cpe->ch[0].coeffs[start+i] - cpe->ch[1].coeffs[start+i];
324 }
325 }
326 start += ics->swb_sizes[g];
327 }
Diego Biurrunc8f47d82009-07-08 21:36:33328 for (cmaxsfb = ics->num_swb; cmaxsfb > 0 && cpe->ch[ch].zeroes[w+cmaxsfb-1]; cmaxsfb--)
329 ;
Alex Converse78e65cd2009-07-08 20:01:31330 maxsfb = FFMAX(maxsfb, cmaxsfb);
331 }
332 ics->max_sfb = maxsfb;
333
334 //adjust zero bands for window groups
Alex Conversefd257dc2009-07-08 20:36:45335 for (w = 0; w < ics->num_windows; w += ics->group_len[w]) {
336 for (g = 0; g < ics->max_sfb; g++) {
Alex Converse78e65cd2009-07-08 20:01:31337 i = 1;
Alex Conversefd257dc2009-07-08 20:36:45338 for (w2 = w; w2 < w + ics->group_len[w]; w2++) {
339 if (!cpe->ch[ch].zeroes[w2*16 + g]) {
Alex Converse78e65cd2009-07-08 20:01:31340 i = 0;
341 break;
342 }
343 }
344 cpe->ch[ch].zeroes[w*16 + g] = i;
345 }
346 }
347 }
348
Alex Conversefd257dc2009-07-08 20:36:45349 if (chans > 1 && cpe->common_window) {
Alex Converse78e65cd2009-07-08 20:01:31350 IndividualChannelStream *ics0 = &cpe->ch[0].ics;
351 IndividualChannelStream *ics1 = &cpe->ch[1].ics;
352 int msc = 0;
353 ics0->max_sfb = FFMAX(ics0->max_sfb, ics1->max_sfb);
354 ics1->max_sfb = ics0->max_sfb;
Alex Conversefd257dc2009-07-08 20:36:45355 for (w = 0; w < ics0->num_windows*16; w += 16)
356 for (i = 0; i < ics0->max_sfb; i++)
Diego Biurrunc8f47d82009-07-08 21:36:33357 if (cpe->ms_mask[w+i])
358 msc++;
Diego Biurrun99d61d32009-07-08 21:16:06359 if (msc == 0 || ics0->max_sfb == 0)
360 cpe->ms_mode = 0;
361 else
362 cpe->ms_mode = msc < ics0->max_sfb ? 1 : 2;
Alex Converse78e65cd2009-07-08 20:01:31363 }
364}
365
366/**
367 * Encode scalefactor band coding type.
368 */
369static void encode_band_info(AACEncContext *s, SingleChannelElement *sce)
370{
371 int w;
372
Diego Biurrunc8f47d82009-07-08 21:36:33373 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w])
Alex Converse78e65cd2009-07-08 20:01:31374 s->coder->encode_window_bands_info(s, sce, w, sce->ics.group_len[w], s->lambda);
Alex Converse78e65cd2009-07-08 20:01:31375}
376
377/**
378 * Encode scalefactors.
379 */
Diego Biurrun99d61d32009-07-08 21:16:06380static void encode_scale_factors(AVCodecContext *avctx, AACEncContext *s,
381 SingleChannelElement *sce)
Alex Converse78e65cd2009-07-08 20:01:31382{
383 int off = sce->sf_idx[0], diff;
384 int i, w;
385
Alex Conversefd257dc2009-07-08 20:36:45386 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
387 for (i = 0; i < sce->ics.max_sfb; i++) {
388 if (!sce->zeroes[w*16 + i]) {
Alex Converse78e65cd2009-07-08 20:01:31389 diff = sce->sf_idx[w*16 + i] - off + SCALE_DIFF_ZERO;
Diego Biurrun99d61d32009-07-08 21:16:06390 if (diff < 0 || diff > 120)
391 av_log(avctx, AV_LOG_ERROR, "Scalefactor difference is too big to be coded\n");
Alex Converse78e65cd2009-07-08 20:01:31392 off = sce->sf_idx[w*16 + i];
393 put_bits(&s->pb, ff_aac_scalefactor_bits[diff], ff_aac_scalefactor_code[diff]);
394 }
395 }
396 }
Kostya Shishkove43b0a72008-08-24 05:56:23397}
398
399/**
Kostya Shishkov817015e2008-08-16 05:47:18400 * Encode pulse data.
401 */
Kostya Shishkovcda00de2008-08-23 15:25:57402static void encode_pulses(AACEncContext *s, Pulse *pulse)
Kostya Shishkov817015e2008-08-16 05:47:18403{
404 int i;
405
406 put_bits(&s->pb, 1, !!pulse->num_pulse);
Diego Biurrun99d61d32009-07-08 21:16:06407 if (!pulse->num_pulse)
408 return;
Kostya Shishkov817015e2008-08-16 05:47:18409
410 put_bits(&s->pb, 2, pulse->num_pulse - 1);
411 put_bits(&s->pb, 6, pulse->start);
Alex Conversefd257dc2009-07-08 20:36:45412 for (i = 0; i < pulse->num_pulse; i++) {
Kostya Shishkovf5c3eae2008-08-16 11:59:36413 put_bits(&s->pb, 5, pulse->pos[i]);
Kostya Shishkov817015e2008-08-16 05:47:18414 put_bits(&s->pb, 4, pulse->amp[i]);
415 }
416}
417
418/**
419 * Encode spectral coefficients processed by psychoacoustic model.
420 */
Kostya Shishkovcda00de2008-08-23 15:25:57421static void encode_spectral_coeffs(AACEncContext *s, SingleChannelElement *sce)
Kostya Shishkov817015e2008-08-16 05:47:18422{
Alex Converse78e65cd2009-07-08 20:01:31423 int start, i, w, w2;
Kostya Shishkov817015e2008-08-16 05:47:18424
Alex Conversefd257dc2009-07-08 20:36:45425 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Kostya Shishkov817015e2008-08-16 05:47:18426 start = 0;
Alex Conversefd257dc2009-07-08 20:36:45427 for (i = 0; i < sce->ics.max_sfb; i++) {
428 if (sce->zeroes[w*16 + i]) {
Kostya Shishkovcda00de2008-08-23 15:25:57429 start += sce->ics.swb_sizes[i];
Kostya Shishkov817015e2008-08-16 05:47:18430 continue;
431 }
Diego Biurrunc8f47d82009-07-08 21:36:33432 for (w2 = w; w2 < w + sce->ics.group_len[w]; w2++)
Alex Converse78e65cd2009-07-08 20:01:31433 s->coder->quantize_and_encode_band(s, &s->pb, sce->coeffs + start + w2*128,
Diego Biurrun99d61d32009-07-08 21:16:06434 sce->ics.swb_sizes[i],
435 sce->sf_idx[w*16 + i],
436 sce->band_type[w*16 + i],
437 s->lambda);
Kostya Shishkovcda00de2008-08-23 15:25:57438 start += sce->ics.swb_sizes[i];
Kostya Shishkov817015e2008-08-16 05:47:18439 }
Kostya Shishkov817015e2008-08-16 05:47:18440 }
441}
442
443/**
Alex Converse78e65cd2009-07-08 20:01:31444 * Encode one channel of audio data.
445 */
Diego Biurrun99d61d32009-07-08 21:16:06446static int encode_individual_channel(AVCodecContext *avctx, AACEncContext *s,
447 SingleChannelElement *sce,
448 int common_window)
Alex Converse78e65cd2009-07-08 20:01:31449{
450 put_bits(&s->pb, 8, sce->sf_idx[0]);
Diego Biurrun99d61d32009-07-08 21:16:06451 if (!common_window)
452 put_ics_info(s, &sce->ics);
Alex Converse78e65cd2009-07-08 20:01:31453 encode_band_info(s, sce);
454 encode_scale_factors(avctx, s, sce);
455 encode_pulses(s, &sce->pulse);
456 put_bits(&s->pb, 1, 0); //tns
457 put_bits(&s->pb, 1, 0); //ssr
458 encode_spectral_coeffs(s, sce);
459 return 0;
460}
461
462/**
Kostya Shishkovc03d9d02008-08-14 05:52:29463 * Write some auxiliary information about the created AAC file.
464 */
Diego Biurrun99d61d32009-07-08 21:16:06465static void put_bitstream_info(AVCodecContext *avctx, AACEncContext *s,
466 const char *name)
Kostya Shishkovc03d9d02008-08-14 05:52:29467{
468 int i, namelen, padbits;
469
470 namelen = strlen(name) + 2;
Kostya Shishkovf5c3eae2008-08-16 11:59:36471 put_bits(&s->pb, 3, TYPE_FIL);
Kostya Shishkovc03d9d02008-08-14 05:52:29472 put_bits(&s->pb, 4, FFMIN(namelen, 15));
Alex Conversefd257dc2009-07-08 20:36:45473 if (namelen >= 15)
Kostya Shishkovc03d9d02008-08-14 05:52:29474 put_bits(&s->pb, 8, namelen - 16);
475 put_bits(&s->pb, 4, 0); //extension type - filler
476 padbits = 8 - (put_bits_count(&s->pb) & 7);
477 align_put_bits(&s->pb);
Alex Conversefd257dc2009-07-08 20:36:45478 for (i = 0; i < namelen - 2; i++)
Kostya Shishkovc03d9d02008-08-14 05:52:29479 put_bits(&s->pb, 8, name[i]);
480 put_bits(&s->pb, 12 - padbits, 0);
481}
482
Alex Converse78e65cd2009-07-08 20:01:31483static int aac_encode_frame(AVCodecContext *avctx,
484 uint8_t *frame, int buf_size, void *data)
485{
486 AACEncContext *s = avctx->priv_data;
487 int16_t *samples = s->samples, *samples2, *la;
488 ChannelElement *cpe;
489 int i, j, chans, tag, start_ch;
490 const uint8_t *chan_map = aac_chan_configs[avctx->channels-1];
491 int chan_el_counter[4];
Måns Rullgård86e41bc32010-07-06 00:06:15492 FFPsyWindowInfo windows[AAC_MAX_CHANNELS];
Alex Converse78e65cd2009-07-08 20:01:31493
Alex Conversefd257dc2009-07-08 20:36:45494 if (s->last_frame)
Alex Converse78e65cd2009-07-08 20:01:31495 return 0;
Alex Conversefd257dc2009-07-08 20:36:45496 if (data) {
497 if (!s->psypp) {
Diego Biurrun99d61d32009-07-08 21:16:06498 memcpy(s->samples + 1024 * avctx->channels, data,
499 1024 * avctx->channels * sizeof(s->samples[0]));
Alex Conversefd257dc2009-07-08 20:36:45500 } else {
Alex Converse78e65cd2009-07-08 20:01:31501 start_ch = 0;
502 samples2 = s->samples + 1024 * avctx->channels;
Alex Conversefd257dc2009-07-08 20:36:45503 for (i = 0; i < chan_map[0]; i++) {
Alex Converse78e65cd2009-07-08 20:01:31504 tag = chan_map[i+1];
505 chans = tag == TYPE_CPE ? 2 : 1;
Diego Biurrun99d61d32009-07-08 21:16:06506 ff_psy_preprocess(s->psypp, (uint16_t*)data + start_ch,
507 samples2 + start_ch, start_ch, chans);
Alex Converse78e65cd2009-07-08 20:01:31508 start_ch += chans;
509 }
510 }
511 }
Alex Conversefd257dc2009-07-08 20:36:45512 if (!avctx->frame_number) {
Diego Biurrun99d61d32009-07-08 21:16:06513 memcpy(s->samples, s->samples + 1024 * avctx->channels,
514 1024 * avctx->channels * sizeof(s->samples[0]));
Alex Converse78e65cd2009-07-08 20:01:31515 return 0;
516 }
517
Alex Converse78e65cd2009-07-08 20:01:31518 start_ch = 0;
Alex Conversefd257dc2009-07-08 20:36:45519 for (i = 0; i < chan_map[0]; i++) {
Alex Converse5962f6b2009-07-08 23:10:13520 FFPsyWindowInfo* wi = windows + start_ch;
Diego Biurrun99d61d32009-07-08 21:16:06521 tag = chan_map[i+1];
522 chans = tag == TYPE_CPE ? 2 : 1;
523 cpe = &s->cpe[i];
Alex Conversefd257dc2009-07-08 20:36:45524 for (j = 0; j < chans; j++) {
Alex Converse78e65cd2009-07-08 20:01:31525 IndividualChannelStream *ics = &cpe->ch[j].ics;
526 int k;
Nathan Caldwell2bb1d0e2010-07-19 18:22:44527 int cur_channel = start_ch + j;
528 samples2 = samples + cur_channel;
529 la = samples2 + (448+64) * avctx->channels;
530 if (!data)
531 la = NULL;
Alex Converse03d5d9b2010-07-07 21:48:51532 if (tag == TYPE_LFE) {
533 wi[j].window_type[0] = ONLY_LONG_SEQUENCE;
534 wi[j].window_shape = 0;
535 wi[j].num_windows = 1;
536 wi[j].grouping[0] = 1;
537 } else {
Nathan Caldwell2bb1d0e2010-07-19 18:22:44538 wi[j] = ff_psy_suggest_window(&s->psy, samples2, la, cur_channel,
Alex Converse26784382010-07-07 21:50:50539 ics->window_sequence[0]);
Alex Converse03d5d9b2010-07-07 21:48:51540 }
Alex Converse78e65cd2009-07-08 20:01:31541 ics->window_sequence[1] = ics->window_sequence[0];
542 ics->window_sequence[0] = wi[j].window_type[0];
543 ics->use_kb_window[1] = ics->use_kb_window[0];
544 ics->use_kb_window[0] = wi[j].window_shape;
545 ics->num_windows = wi[j].num_windows;
546 ics->swb_sizes = s->psy.bands [ics->num_windows == 8];
Alex Converse03d5d9b2010-07-07 21:48:51547 ics->num_swb = tag == TYPE_LFE ? 12 : s->psy.num_bands[ics->num_windows == 8];
Alex Conversefd257dc2009-07-08 20:36:45548 for (k = 0; k < ics->num_windows; k++)
Alex Converse78e65cd2009-07-08 20:01:31549 ics->group_len[k] = wi[j].grouping[k];
550
Nathan Caldwell2bb1d0e2010-07-19 18:22:44551 apply_window_and_mdct(avctx, s, &cpe->ch[j], samples2);
Alex Converse5962f6b2009-07-08 23:10:13552 }
553 start_ch += chans;
554 }
Alex Converse48d20c12009-07-08 23:12:53555 do {
556 int frame_bits;
Alex Conversef11bfe32009-07-08 23:14:47557 init_put_bits(&s->pb, frame, buf_size*8);
558 if ((avctx->frame_number & 0xFF)==1 && !(avctx->flags & CODEC_FLAG_BITEXACT))
559 put_bitstream_info(avctx, s, LIBAVCODEC_IDENT);
560 start_ch = 0;
561 memset(chan_el_counter, 0, sizeof(chan_el_counter));
562 for (i = 0; i < chan_map[0]; i++) {
563 FFPsyWindowInfo* wi = windows + start_ch;
564 tag = chan_map[i+1];
565 chans = tag == TYPE_CPE ? 2 : 1;
566 cpe = &s->cpe[i];
Alex Converse8e4c11e2010-08-30 23:52:03567 put_bits(&s->pb, 3, tag);
568 put_bits(&s->pb, 4, chan_el_counter[tag]++);
Alex Conversef11bfe32009-07-08 23:14:47569 for (j = 0; j < chans; j++) {
Alex Converse495af352010-05-11 18:53:49570 s->cur_channel = start_ch + j;
Alex Converse31184aa2010-05-14 16:49:11571 ff_psy_set_band_info(&s->psy, s->cur_channel, cpe->ch[j].coeffs, &wi[j]);
Alex Conversef11bfe32009-07-08 23:14:47572 s->coder->search_for_quantizers(avctx, s, &cpe->ch[j], s->lambda);
573 }
574 cpe->common_window = 0;
575 if (chans > 1
576 && wi[0].window_type[0] == wi[1].window_type[0]
577 && wi[0].window_shape == wi[1].window_shape) {
Alex Converse78e65cd2009-07-08 20:01:31578
Alex Conversef11bfe32009-07-08 23:14:47579 cpe->common_window = 1;
580 for (j = 0; j < wi[0].num_windows; j++) {
581 if (wi[0].grouping[j] != wi[1].grouping[j]) {
582 cpe->common_window = 0;
583 break;
584 }
Alex Converse78e65cd2009-07-08 20:01:31585 }
586 }
Alex Converse495af352010-05-11 18:53:49587 s->cur_channel = start_ch;
Alex Conversef11bfe32009-07-08 23:14:47588 if (cpe->common_window && s->coder->search_for_ms)
589 s->coder->search_for_ms(s, cpe, s->lambda);
590 adjust_frame_information(s, cpe, chans);
Alex Conversef11bfe32009-07-08 23:14:47591 if (chans == 2) {
592 put_bits(&s->pb, 1, cpe->common_window);
593 if (cpe->common_window) {
594 put_ics_info(s, &cpe->ch[0].ics);
595 encode_ms_info(&s->pb, cpe);
596 }
Alex Converse78e65cd2009-07-08 20:01:31597 }
Alex Conversef11bfe32009-07-08 23:14:47598 for (j = 0; j < chans; j++) {
599 s->cur_channel = start_ch + j;
Alex Conversef11bfe32009-07-08 23:14:47600 encode_individual_channel(avctx, s, &cpe->ch[j], cpe->common_window);
601 }
602 start_ch += chans;
Alex Converse78e65cd2009-07-08 20:01:31603 }
Alex Converse78e65cd2009-07-08 20:01:31604
Alex Converse48d20c12009-07-08 23:12:53605 frame_bits = put_bits_count(&s->pb);
606 if (frame_bits <= 6144 * avctx->channels - 3)
607 break;
608
609 s->lambda *= avctx->bit_rate * 1024.0f / avctx->sample_rate / frame_bits;
610
611 } while (1);
612
Alex Converse78e65cd2009-07-08 20:01:31613 put_bits(&s->pb, 3, TYPE_END);
614 flush_put_bits(&s->pb);
615 avctx->frame_bits = put_bits_count(&s->pb);
616
617 // rate control stuff
Alex Conversefd257dc2009-07-08 20:36:45618 if (!(avctx->flags & CODEC_FLAG_QSCALE)) {
Alex Converse78e65cd2009-07-08 20:01:31619 float ratio = avctx->bit_rate * 1024.0f / avctx->sample_rate / avctx->frame_bits;
620 s->lambda *= ratio;
Alex Converse988c1702009-07-09 17:22:59621 s->lambda = FFMIN(s->lambda, 65536.f);
Alex Converse78e65cd2009-07-08 20:01:31622 }
623
Alex Conversefd257dc2009-07-08 20:36:45624 if (!data)
Alex Converse78e65cd2009-07-08 20:01:31625 s->last_frame = 1;
Diego Biurrun99d61d32009-07-08 21:16:06626 memcpy(s->samples, s->samples + 1024 * avctx->channels,
627 1024 * avctx->channels * sizeof(s->samples[0]));
Alex Converse78e65cd2009-07-08 20:01:31628 return put_bits_count(&s->pb)>>3;
629}
630
Kostya Shishkovc03d9d02008-08-14 05:52:29631static av_cold int aac_encode_end(AVCodecContext *avctx)
632{
633 AACEncContext *s = avctx->priv_data;
634
635 ff_mdct_end(&s->mdct1024);
636 ff_mdct_end(&s->mdct128);
Alex Converse78e65cd2009-07-08 20:01:31637 ff_psy_end(&s->psy);
638 ff_psy_preprocess_end(s->psypp);
Kostya Shishkovc03d9d02008-08-14 05:52:29639 av_freep(&s->samples);
640 av_freep(&s->cpe);
641 return 0;
642}
643
644AVCodec aac_encoder = {
645 "aac",
Stefano Sabatini72415b22010-03-30 23:30:55646 AVMEDIA_TYPE_AUDIO,
Kostya Shishkovc03d9d02008-08-14 05:52:29647 CODEC_ID_AAC,
648 sizeof(AACEncContext),
649 aac_encode_init,
650 aac_encode_frame,
651 aac_encode_end,
Alex Conversee84c2762010-05-27 14:46:31652 .capabilities = CODEC_CAP_SMALL_LAST_FRAME | CODEC_CAP_DELAY | CODEC_CAP_EXPERIMENTAL,
Stefano Sabatini5d6e4c12010-11-12 11:04:40653 .sample_fmts = (const enum AVSampleFormat[]){AV_SAMPLE_FMT_S16,AV_SAMPLE_FMT_NONE},
Kostya Shishkovc03d9d02008-08-14 05:52:29654 .long_name = NULL_IF_CONFIG_SMALL("Advanced Audio Coding"),
655};