blob: a1004c3e98358106cf4767f192cb655330baec50 [file] [log] [blame]
Kostya Shishkovc03d9d02008-08-14 05:52:291/*
2 * AAC encoder
3 * Copyright (C) 2008 Konstantin Shishkov
4 *
5 * This file is part of FFmpeg.
6 *
7 * FFmpeg is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
11 *
12 * FFmpeg is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
16 *
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with FFmpeg; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
20 */
21
22/**
Diego Biurrunba87f082010-04-20 14:45:3423 * @file
Kostya Shishkovc03d9d02008-08-14 05:52:2924 * AAC encoder
25 */
26
27/***********************************
28 * TODOs:
Kostya Shishkov817015e2008-08-16 05:47:1829 * add sane pulse detection
Kostya Shishkovc03d9d02008-08-14 05:52:2930 ***********************************/
Michael Niedermayera7a7f322021-05-28 19:37:2631#include <float.h>
Kostya Shishkovc03d9d02008-08-14 05:52:2932
Andreas Rheinhardt1be3d8a2021-06-11 23:10:5833#include "libavutil/channel_layout.h"
Ganesh Ajjanagadde2e4fd162016-01-14 22:55:5634#include "libavutil/libm.h"
Justin Rugglesd5a72292012-05-21 16:58:4135#include "libavutil/float_dsp.h"
Nathan Caldwellcc9947f2011-06-01 05:38:0936#include "libavutil/opt.h"
Kostya Shishkovc03d9d02008-08-14 05:52:2937#include "avcodec.h"
Andreas Rheinhardt56e9e022021-05-11 13:17:1338#include "encode.h"
Alex Converse78e65cd2009-07-08 20:01:3139#include "put_bits.h"
Justin Rugglesad953072012-01-28 17:28:0140#include "internal.h"
Kostya Shishkovc03d9d02008-08-14 05:52:2941#include "mpeg4audio.h"
Mans Rullgard45387292011-03-19 23:44:0042#include "sinewin.h"
Marton Balintaee036c2020-05-10 18:38:1143#include "profiles.h"
Kostya Shishkovc03d9d02008-08-14 05:52:2944
Kostya Shishkovc03d9d02008-08-14 05:52:2945#include "aac.h"
46#include "aactab.h"
Alex Converse78e65cd2009-07-08 20:01:3147#include "aacenc.h"
Rostislav Pehlivanovc47c7812015-07-29 04:44:2648#include "aacenctab.h"
Rostislav Pehlivanovef8e5a62015-07-29 04:44:2749#include "aacenc_utils.h"
Alex Converse78e65cd2009-07-08 20:01:3150
51#include "psymodel.h"
Kostya Shishkovc03d9d02008-08-14 05:52:2952
Rostislav Pehlivanovfbf295e2016-10-03 18:53:1153static void put_pce(PutBitContext *pb, AVCodecContext *avctx)
54{
55 int i, j;
56 AACEncContext *s = avctx->priv_data;
57 AACPCEInfo *pce = &s->pce;
Rostislav Pehlivanov7b7775a2017-11-09 04:30:0758 const int bitexact = avctx->flags & AV_CODEC_FLAG_BITEXACT;
59 const char *aux_data = bitexact ? "Lavc" : LIBAVCODEC_IDENT;
Rostislav Pehlivanovfbf295e2016-10-03 18:53:1160
61 put_bits(pb, 4, 0);
62
63 put_bits(pb, 2, avctx->profile);
64 put_bits(pb, 4, s->samplerate_index);
65
66 put_bits(pb, 4, pce->num_ele[0]); /* Front */
67 put_bits(pb, 4, pce->num_ele[1]); /* Side */
68 put_bits(pb, 4, pce->num_ele[2]); /* Back */
69 put_bits(pb, 2, pce->num_ele[3]); /* LFE */
70 put_bits(pb, 3, 0); /* Assoc data */
71 put_bits(pb, 4, 0); /* CCs */
72
73 put_bits(pb, 1, 0); /* Stereo mixdown */
74 put_bits(pb, 1, 0); /* Mono mixdown */
75 put_bits(pb, 1, 0); /* Something else */
76
77 for (i = 0; i < 4; i++) {
78 for (j = 0; j < pce->num_ele[i]; j++) {
79 if (i < 3)
80 put_bits(pb, 1, pce->pairing[i][j]);
81 put_bits(pb, 4, pce->index[i][j]);
82 }
83 }
84
Anton Khirnov717503f2020-10-26 12:36:0685 align_put_bits(pb);
Rostislav Pehlivanov7b7775a2017-11-09 04:30:0786 put_bits(pb, 8, strlen(aux_data));
Anton Khirnov944ba302020-10-26 12:41:3987 ff_put_string(pb, aux_data, 0);
Rostislav Pehlivanovfbf295e2016-10-03 18:53:1188}
89
Nathan Caldwell9b8e2a82011-12-15 02:43:5690/**
Kostya Shishkovc03d9d02008-08-14 05:52:2991 * Make AAC audio config object.
92 * @see 1.6.2.1 "Syntax - AudioSpecificConfig"
93 */
Rostislav Pehlivanov7b7775a2017-11-09 04:30:0794static int put_audio_specific_config(AVCodecContext *avctx)
Kostya Shishkovc03d9d02008-08-14 05:52:2995{
96 PutBitContext pb;
97 AACEncContext *s = avctx->priv_data;
Rostislav Pehlivanovfbf295e2016-10-03 18:53:1198 int channels = (!s->needs_pce)*(s->channels - (s->channels == 8 ? 1 : 0));
Rostislav Pehlivanov7b7775a2017-11-09 04:30:0799 const int max_size = 32;
Kostya Shishkovc03d9d02008-08-14 05:52:29100
Rostislav Pehlivanov7b7775a2017-11-09 04:30:07101 avctx->extradata = av_mallocz(max_size);
102 if (!avctx->extradata)
103 return AVERROR(ENOMEM);
104
105 init_put_bits(&pb, avctx->extradata, max_size);
Rostislav Pehlivanoveab12d02015-08-21 18:20:22106 put_bits(&pb, 5, s->profile+1); //profile
Kostya Shishkovc03d9d02008-08-14 05:52:29107 put_bits(&pb, 4, s->samplerate_index); //sample rate index
Rostislav Pehlivanovb3deaec2015-10-12 14:53:17108 put_bits(&pb, 4, channels);
Kostya Shishkovc03d9d02008-08-14 05:52:29109 //GASpecificConfig
110 put_bits(&pb, 1, 0); //frame length - 1024 samples
111 put_bits(&pb, 1, 0); //does not depend on core coder
112 put_bits(&pb, 1, 0); //is not extension
Rostislav Pehlivanovfbf295e2016-10-03 18:53:11113 if (s->needs_pce)
114 put_pce(&pb, avctx);
Alex Conversed67a6aa2011-01-22 05:23:43115
116 //Explicitly Mark SBR absent
Janne Grunau604eb1522011-01-23 14:45:19117 put_bits(&pb, 11, 0x2b7); //sync extension
Alex Conversed67a6aa2011-01-22 05:23:43118 put_bits(&pb, 5, AOT_SBR);
119 put_bits(&pb, 1, 0);
Kostya Shishkovc03d9d02008-08-14 05:52:29120 flush_put_bits(&pb);
Andreas Rheinhardtc81b8e02021-03-25 11:52:56121 avctx->extradata_size = put_bytes_output(&pb);
Rostislav Pehlivanov7b7775a2017-11-09 04:30:07122
123 return 0;
Kostya Shishkovc03d9d02008-08-14 05:52:29124}
125
Claudio Freireb629c672015-10-12 06:56:22126void ff_quantize_band_cost_cache_init(struct AACEncContext *s)
127{
Reimar Döffingerb91e3762016-03-06 16:28:42128 ++s->quantize_band_cost_cache_generation;
129 if (s->quantize_band_cost_cache_generation == 0) {
130 memset(s->quantize_band_cost_cache, 0, sizeof(s->quantize_band_cost_cache));
131 s->quantize_band_cost_cache_generation = 1;
Claudio Freireb629c672015-10-12 06:56:22132 }
133}
134
/* Expands to the signature of a windowing function named
 * apply_<seq>_window(); the function body follows the macro invocation. */
#define WINDOW_FUNC(seq) \
static void apply_ ##seq ##_window(AVFloatDSPContext *fdsp, \
                                   SingleChannelElement *sce, \
                                   const float *audio)
Nathan Caldwell9292fe42011-12-24 00:36:15139
140WINDOW_FUNC(only_long)
Kostya Shishkovc03d9d02008-08-14 05:52:29141{
Nathan Caldwell9292fe42011-12-24 00:36:15142 const float *lwindow = sce->ics.use_kb_window[0] ? ff_aac_kbd_long_1024 : ff_sine_1024;
143 const float *pwindow = sce->ics.use_kb_window[1] ? ff_aac_kbd_long_1024 : ff_sine_1024;
Michael Niedermayer59b68ee2012-11-26 14:15:02144 float *out = sce->ret_buf;
Kostya Shishkovc03d9d02008-08-14 05:52:29145
Ronald S. Bultje42d32462013-01-20 21:20:30146 fdsp->vector_fmul (out, audio, lwindow, 1024);
147 fdsp->vector_fmul_reverse(out + 1024, audio + 1024, pwindow, 1024);
Kostya Shishkovc03d9d02008-08-14 05:52:29148}
149
Nathan Caldwell9292fe42011-12-24 00:36:15150WINDOW_FUNC(long_start)
Alex Converse78e65cd2009-07-08 20:01:31151{
Nathan Caldwell9292fe42011-12-24 00:36:15152 const float *lwindow = sce->ics.use_kb_window[1] ? ff_aac_kbd_long_1024 : ff_sine_1024;
153 const float *swindow = sce->ics.use_kb_window[0] ? ff_aac_kbd_short_128 : ff_sine_128;
Michael Niedermayer59b68ee2012-11-26 14:15:02154 float *out = sce->ret_buf;
Nathan Caldwell9292fe42011-12-24 00:36:15155
Justin Rugglesd5a72292012-05-21 16:58:41156 fdsp->vector_fmul(out, audio, lwindow, 1024);
Nathan Caldwell2e626dd2012-01-28 05:23:41157 memcpy(out + 1024, audio + 1024, sizeof(out[0]) * 448);
Ronald S. Bultje42d32462013-01-20 21:20:30158 fdsp->vector_fmul_reverse(out + 1024 + 448, audio + 1024 + 448, swindow, 128);
Nathan Caldwell9292fe42011-12-24 00:36:15159 memset(out + 1024 + 576, 0, sizeof(out[0]) * 448);
160}
161
162WINDOW_FUNC(long_stop)
163{
164 const float *lwindow = sce->ics.use_kb_window[0] ? ff_aac_kbd_long_1024 : ff_sine_1024;
165 const float *swindow = sce->ics.use_kb_window[1] ? ff_aac_kbd_short_128 : ff_sine_128;
Michael Niedermayer59b68ee2012-11-26 14:15:02166 float *out = sce->ret_buf;
Nathan Caldwell9292fe42011-12-24 00:36:15167
168 memset(out, 0, sizeof(out[0]) * 448);
Justin Rugglesd5a72292012-05-21 16:58:41169 fdsp->vector_fmul(out + 448, audio + 448, swindow, 128);
Nathan Caldwell9292fe42011-12-24 00:36:15170 memcpy(out + 576, audio + 576, sizeof(out[0]) * 448);
Ronald S. Bultje42d32462013-01-20 21:20:30171 fdsp->vector_fmul_reverse(out + 1024, audio + 1024, lwindow, 1024);
Nathan Caldwell9292fe42011-12-24 00:36:15172}
173
174WINDOW_FUNC(eight_short)
175{
176 const float *swindow = sce->ics.use_kb_window[0] ? ff_aac_kbd_short_128 : ff_sine_128;
177 const float *pwindow = sce->ics.use_kb_window[1] ? ff_aac_kbd_short_128 : ff_sine_128;
178 const float *in = audio + 448;
Michael Niedermayer59b68ee2012-11-26 14:15:02179 float *out = sce->ret_buf;
Mans Rullgard3715d8412012-01-29 20:55:10180 int w;
Nathan Caldwell9292fe42011-12-24 00:36:15181
Mans Rullgard3715d8412012-01-29 20:55:10182 for (w = 0; w < 8; w++) {
Ronald S. Bultje42d32462013-01-20 21:20:30183 fdsp->vector_fmul (out, in, w ? pwindow : swindow, 128);
Nathan Caldwell9292fe42011-12-24 00:36:15184 out += 128;
185 in += 128;
Ronald S. Bultje42d32462013-01-20 21:20:30186 fdsp->vector_fmul_reverse(out, in, swindow, 128);
Nathan Caldwell9292fe42011-12-24 00:36:15187 out += 128;
188 }
189}
190
Ronald S. Bultje42d32462013-01-20 21:20:30191static void (*const apply_window[4])(AVFloatDSPContext *fdsp,
Justin Rugglesd5a72292012-05-21 16:58:41192 SingleChannelElement *sce,
193 const float *audio) = {
Nathan Caldwell9292fe42011-12-24 00:36:15194 [ONLY_LONG_SEQUENCE] = apply_only_long_window,
195 [LONG_START_SEQUENCE] = apply_long_start_window,
196 [EIGHT_SHORT_SEQUENCE] = apply_eight_short_window,
197 [LONG_STOP_SEQUENCE] = apply_long_stop_window
198};
199
Nathan Caldwell04af2ef2011-12-07 22:20:10200static void apply_window_and_mdct(AACEncContext *s, SingleChannelElement *sce,
201 float *audio)
Alex Converse78e65cd2009-07-08 20:01:31202{
Nathan Caldwell9292fe42011-12-24 00:36:15203 int i;
Michael Niedermayer90065672016-01-13 15:40:22204 const float *output = sce->ret_buf;
Alex Converse78e65cd2009-07-08 20:01:31205
Michael Niedermayer14285c32014-11-29 17:58:13206 apply_window[sce->ics.window_sequence[0]](s->fdsp, sce, audio);
Nathan Caldwell9292fe42011-12-24 00:36:15207
208 if (sce->ics.window_sequence[0] != EIGHT_SHORT_SEQUENCE)
Mans Rullgard26f548b2011-03-19 15:14:17209 s->mdct1024.mdct_calc(&s->mdct1024, sce->coeffs, output);
Nathan Caldwell9292fe42011-12-24 00:36:15210 else
211 for (i = 0; i < 1024; i += 128)
Rostislav Pehlivanov32be2642015-08-21 17:30:51212 s->mdct128.mdct_calc(&s->mdct128, &sce->coeffs[i], output + i*2);
Nathan Caldwell9292fe42011-12-24 00:36:15213 memcpy(audio, audio + 1024, sizeof(audio[0]) * 1024);
Claudio Freire6394aca2015-03-03 06:43:06214 memcpy(sce->pcoeffs, sce->coeffs, sizeof(sce->pcoeffs));
Alex Converse78e65cd2009-07-08 20:01:31215}
216
Kostya Shishkovc03d9d02008-08-14 05:52:29217/**
218 * Encode ics_info element.
219 * @see Table 4.6 (syntax of ics_info)
220 */
Kostya Shishkove43b0a72008-08-24 05:56:23221static void put_ics_info(AACEncContext *s, IndividualChannelStream *info)
Kostya Shishkovc03d9d02008-08-14 05:52:29222{
Alex Converse78e65cd2009-07-08 20:01:31223 int w;
Kostya Shishkovc03d9d02008-08-14 05:52:29224
225 put_bits(&s->pb, 1, 0); // ics_reserved bit
226 put_bits(&s->pb, 2, info->window_sequence[0]);
227 put_bits(&s->pb, 1, info->use_kb_window[0]);
Alex Conversefd257dc2009-07-08 20:36:45228 if (info->window_sequence[0] != EIGHT_SHORT_SEQUENCE) {
Kostya Shishkovc03d9d02008-08-14 05:52:29229 put_bits(&s->pb, 6, info->max_sfb);
Rostislav Pehlivanov76b81b12015-08-21 18:38:05230 put_bits(&s->pb, 1, !!info->predictor_present);
Alex Conversefd257dc2009-07-08 20:36:45231 } else {
Kostya Shishkovc03d9d02008-08-14 05:52:29232 put_bits(&s->pb, 4, info->max_sfb);
Diego Biurrunc8f47d82009-07-08 21:36:33233 for (w = 1; w < 8; w++)
Alex Converse78e65cd2009-07-08 20:01:31234 put_bits(&s->pb, 1, !info->group_len[w]);
Kostya Shishkovc03d9d02008-08-14 05:52:29235 }
236}
237
238/**
Alex Converse78e65cd2009-07-08 20:01:31239 * Encode MS data.
240 * @see 4.6.8.1 "Joint Coding - M/S Stereo"
Kostya Shishkove43b0a72008-08-24 05:56:23241 */
Alex Converse78e65cd2009-07-08 20:01:31242static void encode_ms_info(PutBitContext *pb, ChannelElement *cpe)
Kostya Shishkove43b0a72008-08-24 05:56:23243{
Kostya Shishkove43b0a72008-08-24 05:56:23244 int i, w;
Alex Converse78e65cd2009-07-08 20:01:31245
246 put_bits(pb, 2, cpe->ms_mode);
Diego Biurrunc8f47d82009-07-08 21:36:33247 if (cpe->ms_mode == 1)
248 for (w = 0; w < cpe->ch[0].ics.num_windows; w += cpe->ch[0].ics.group_len[w])
Alex Conversefd257dc2009-07-08 20:36:45249 for (i = 0; i < cpe->ch[0].ics.max_sfb; i++)
Alex Converse78e65cd2009-07-08 20:01:31250 put_bits(pb, 1, cpe->ms_mask[w*16 + i]);
Alex Converse78e65cd2009-07-08 20:01:31251}
252
253/**
254 * Produce integer coefficients from scalefactors provided by the model.
255 */
Diego Biurrun72c758f2012-10-24 17:16:08256static void adjust_frame_information(ChannelElement *cpe, int chans)
Alex Converse78e65cd2009-07-08 20:01:31257{
258 int i, w, w2, g, ch;
Rostislav Pehlivanov0b233902015-07-02 18:13:06259 int maxsfb, cmaxsfb;
Rostislav Pehlivanov0b233902015-07-02 18:13:06260
261 for (ch = 0; ch < chans; ch++) {
262 IndividualChannelStream *ics = &cpe->ch[ch].ics;
263 maxsfb = 0;
264 cpe->ch[ch].pulse.num_pulse = 0;
265 for (w = 0; w < ics->num_windows; w += ics->group_len[w]) {
266 for (w2 = 0; w2 < ics->group_len[w]; w2++) {
Claudio Freire6394aca2015-03-03 06:43:06267 for (cmaxsfb = ics->num_swb; cmaxsfb > 0 && cpe->ch[ch].zeroes[w*16+cmaxsfb-1]; cmaxsfb--)
268 ;
269 maxsfb = FFMAX(maxsfb, cmaxsfb);
Alex Converse78e65cd2009-07-08 20:01:31270 }
Alex Converse78e65cd2009-07-08 20:01:31271 }
272 ics->max_sfb = maxsfb;
273
274 //adjust zero bands for window groups
Alex Conversefd257dc2009-07-08 20:36:45275 for (w = 0; w < ics->num_windows; w += ics->group_len[w]) {
276 for (g = 0; g < ics->max_sfb; g++) {
Alex Converse78e65cd2009-07-08 20:01:31277 i = 1;
Alex Conversefd257dc2009-07-08 20:36:45278 for (w2 = w; w2 < w + ics->group_len[w]; w2++) {
279 if (!cpe->ch[ch].zeroes[w2*16 + g]) {
Alex Converse78e65cd2009-07-08 20:01:31280 i = 0;
281 break;
282 }
283 }
284 cpe->ch[ch].zeroes[w*16 + g] = i;
285 }
286 }
287 }
288
Alex Conversefd257dc2009-07-08 20:36:45289 if (chans > 1 && cpe->common_window) {
Alex Converse78e65cd2009-07-08 20:01:31290 IndividualChannelStream *ics0 = &cpe->ch[0].ics;
291 IndividualChannelStream *ics1 = &cpe->ch[1].ics;
292 int msc = 0;
293 ics0->max_sfb = FFMAX(ics0->max_sfb, ics1->max_sfb);
294 ics1->max_sfb = ics0->max_sfb;
Alex Conversefd257dc2009-07-08 20:36:45295 for (w = 0; w < ics0->num_windows*16; w += 16)
296 for (i = 0; i < ics0->max_sfb; i++)
Diego Biurrunc8f47d82009-07-08 21:36:33297 if (cpe->ms_mask[w+i])
298 msc++;
Diego Biurrun99d61d32009-07-08 21:16:06299 if (msc == 0 || ics0->max_sfb == 0)
300 cpe->ms_mode = 0;
301 else
Nathan Caldwell98add742011-06-29 03:11:39302 cpe->ms_mode = msc < ics0->max_sfb * ics0->num_windows ? 1 : 2;
Alex Converse78e65cd2009-07-08 20:01:31303 }
304}
305
Rostislav Pehlivanov20dc5272015-09-02 05:26:45306static void apply_intensity_stereo(ChannelElement *cpe)
307{
308 int w, w2, g, i;
309 IndividualChannelStream *ics = &cpe->ch[0].ics;
310 if (!cpe->common_window)
311 return;
312 for (w = 0; w < ics->num_windows; w += ics->group_len[w]) {
313 for (w2 = 0; w2 < ics->group_len[w]; w2++) {
314 int start = (w+w2) * 128;
315 for (g = 0; g < ics->num_swb; g++) {
316 int p = -1 + 2 * (cpe->ch[1].band_type[w*16+g] - 14);
317 float scale = cpe->ch[0].is_ener[w*16+g];
318 if (!cpe->is_mask[w*16 + g]) {
319 start += ics->swb_sizes[g];
320 continue;
321 }
Claudio Freire01ecb712015-10-11 20:29:50322 if (cpe->ms_mask[w*16 + g])
323 p *= -1;
Rostislav Pehlivanov20dc5272015-09-02 05:26:45324 for (i = 0; i < ics->swb_sizes[g]; i++) {
325 float sum = (cpe->ch[0].coeffs[start+i] + p*cpe->ch[1].coeffs[start+i])*scale;
326 cpe->ch[0].coeffs[start+i] = sum;
327 cpe->ch[1].coeffs[start+i] = 0.0f;
328 }
329 start += ics->swb_sizes[g];
330 }
331 }
332 }
333}
334
335static void apply_mid_side_stereo(ChannelElement *cpe)
336{
337 int w, w2, g, i;
338 IndividualChannelStream *ics = &cpe->ch[0].ics;
339 if (!cpe->common_window)
340 return;
341 for (w = 0; w < ics->num_windows; w += ics->group_len[w]) {
342 for (w2 = 0; w2 < ics->group_len[w]; w2++) {
343 int start = (w+w2) * 128;
344 for (g = 0; g < ics->num_swb; g++) {
Claudio Freirefc36d852015-11-26 06:27:06345 /* ms_mask can be used for other purposes in PNS and I/S,
346 * so must not apply M/S if any band uses either, even if
347 * ms_mask is set.
348 */
349 if (!cpe->ms_mask[w*16 + g] || cpe->is_mask[w*16 + g]
Claudio Freire509f1682016-01-08 08:04:37350 || cpe->ch[0].band_type[w*16 + g] >= NOISE_BT
351 || cpe->ch[1].band_type[w*16 + g] >= NOISE_BT) {
Rostislav Pehlivanov20dc5272015-09-02 05:26:45352 start += ics->swb_sizes[g];
353 continue;
354 }
355 for (i = 0; i < ics->swb_sizes[g]; i++) {
356 float L = (cpe->ch[0].coeffs[start+i] + cpe->ch[1].coeffs[start+i]) * 0.5f;
357 float R = L - cpe->ch[1].coeffs[start+i];
358 cpe->ch[0].coeffs[start+i] = L;
359 cpe->ch[1].coeffs[start+i] = R;
360 }
361 start += ics->swb_sizes[g];
362 }
363 }
364 }
365}
366
Alex Converse78e65cd2009-07-08 20:01:31367/**
368 * Encode scalefactor band coding type.
369 */
370static void encode_band_info(AACEncContext *s, SingleChannelElement *sce)
371{
372 int w;
373
Rostislav Pehlivanov20dc5272015-09-02 05:26:45374 if (s->coder->set_special_band_scalefactors)
375 s->coder->set_special_band_scalefactors(s, sce);
376
Diego Biurrunc8f47d82009-07-08 21:36:33377 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w])
Alex Converse78e65cd2009-07-08 20:01:31378 s->coder->encode_window_bands_info(s, sce, w, sce->ics.group_len[w], s->lambda);
Alex Converse78e65cd2009-07-08 20:01:31379}
380
381/**
382 * Encode scalefactors.
383 */
Diego Biurrun99d61d32009-07-08 21:16:06384static void encode_scale_factors(AVCodecContext *avctx, AACEncContext *s,
385 SingleChannelElement *sce)
Alex Converse78e65cd2009-07-08 20:01:31386{
Rostislav Pehlivanov013498b2015-04-13 23:33:51387 int diff, off_sf = sce->sf_idx[0], off_pns = sce->sf_idx[0] - NOISE_OFFSET;
Rostislav Pehlivanov7c10b872015-06-26 20:16:34388 int off_is = 0, noise_flag = 1;
Alex Converse78e65cd2009-07-08 20:01:31389 int i, w;
390
Alex Conversefd257dc2009-07-08 20:36:45391 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
392 for (i = 0; i < sce->ics.max_sfb; i++) {
393 if (!sce->zeroes[w*16 + i]) {
Rostislav Pehlivanovf7f71b52015-04-12 04:50:34394 if (sce->band_type[w*16 + i] == NOISE_BT) {
395 diff = sce->sf_idx[w*16 + i] - off_pns;
396 off_pns = sce->sf_idx[w*16 + i];
397 if (noise_flag-- > 0) {
398 put_bits(&s->pb, NOISE_PRE_BITS, diff + NOISE_PRE);
399 continue;
400 }
Rostislav Pehlivanov7c10b872015-06-26 20:16:34401 } else if (sce->band_type[w*16 + i] == INTENSITY_BT ||
402 sce->band_type[w*16 + i] == INTENSITY_BT2) {
403 diff = sce->sf_idx[w*16 + i] - off_is;
404 off_is = sce->sf_idx[w*16 + i];
Rostislav Pehlivanovf7f71b52015-04-12 04:50:34405 } else {
406 diff = sce->sf_idx[w*16 + i] - off_sf;
407 off_sf = sce->sf_idx[w*16 + i];
408 }
409 diff += SCALE_DIFF_ZERO;
Michael Niedermayerf69f9b32012-10-26 00:11:20410 av_assert0(diff >= 0 && diff <= 120);
Alex Converse78e65cd2009-07-08 20:01:31411 put_bits(&s->pb, ff_aac_scalefactor_bits[diff], ff_aac_scalefactor_code[diff]);
412 }
413 }
414 }
Kostya Shishkove43b0a72008-08-24 05:56:23415}
416
417/**
Kostya Shishkov817015e2008-08-16 05:47:18418 * Encode pulse data.
419 */
Kostya Shishkovcda00de2008-08-23 15:25:57420static void encode_pulses(AACEncContext *s, Pulse *pulse)
Kostya Shishkov817015e2008-08-16 05:47:18421{
422 int i;
423
424 put_bits(&s->pb, 1, !!pulse->num_pulse);
Diego Biurrun99d61d32009-07-08 21:16:06425 if (!pulse->num_pulse)
426 return;
Kostya Shishkov817015e2008-08-16 05:47:18427
428 put_bits(&s->pb, 2, pulse->num_pulse - 1);
429 put_bits(&s->pb, 6, pulse->start);
Alex Conversefd257dc2009-07-08 20:36:45430 for (i = 0; i < pulse->num_pulse; i++) {
Kostya Shishkovf5c3eae2008-08-16 11:59:36431 put_bits(&s->pb, 5, pulse->pos[i]);
Kostya Shishkov817015e2008-08-16 05:47:18432 put_bits(&s->pb, 4, pulse->amp[i]);
433 }
434}
435
436/**
437 * Encode spectral coefficients processed by psychoacoustic model.
438 */
Kostya Shishkovcda00de2008-08-23 15:25:57439static void encode_spectral_coeffs(AACEncContext *s, SingleChannelElement *sce)
Kostya Shishkov817015e2008-08-16 05:47:18440{
Alex Converse78e65cd2009-07-08 20:01:31441 int start, i, w, w2;
Kostya Shishkov817015e2008-08-16 05:47:18442
Alex Conversefd257dc2009-07-08 20:36:45443 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Kostya Shishkov817015e2008-08-16 05:47:18444 start = 0;
Alex Conversefd257dc2009-07-08 20:36:45445 for (i = 0; i < sce->ics.max_sfb; i++) {
446 if (sce->zeroes[w*16 + i]) {
Kostya Shishkovcda00de2008-08-23 15:25:57447 start += sce->ics.swb_sizes[i];
Kostya Shishkov817015e2008-08-16 05:47:18448 continue;
449 }
Rostislav Pehlivanov44ddee92015-08-29 05:34:08450 for (w2 = w; w2 < w + sce->ics.group_len[w]; w2++) {
Rostislav Pehlivanov43b378a2015-08-21 17:53:14451 s->coder->quantize_and_encode_band(s, &s->pb,
452 &sce->coeffs[start + w2*128],
Rostislav Pehlivanov44ddee92015-08-29 05:34:08453 NULL, sce->ics.swb_sizes[i],
Diego Biurrun99d61d32009-07-08 21:16:06454 sce->sf_idx[w*16 + i],
455 sce->band_type[w*16 + i],
Rostislav Pehlivanov43b378a2015-08-21 17:53:14456 s->lambda,
457 sce->ics.window_clipping[w]);
Rostislav Pehlivanov44ddee92015-08-29 05:34:08458 }
Kostya Shishkovcda00de2008-08-23 15:25:57459 start += sce->ics.swb_sizes[i];
Kostya Shishkov817015e2008-08-16 05:47:18460 }
Kostya Shishkov817015e2008-08-16 05:47:18461 }
462}
463
464/**
Claudio Freire59216e02015-07-21 01:53:24465 * Downscale spectral coefficients for near-clipping windows to avoid artifacts
466 */
467static void avoid_clipping(AACEncContext *s, SingleChannelElement *sce)
468{
469 int start, i, j, w;
470
471 if (sce->ics.clip_avoidance_factor < 1.0f) {
472 for (w = 0; w < sce->ics.num_windows; w++) {
473 start = 0;
474 for (i = 0; i < sce->ics.max_sfb; i++) {
Rostislav Pehlivanov32be2642015-08-21 17:30:51475 float *swb_coeffs = &sce->coeffs[start + w*128];
Claudio Freire59216e02015-07-21 01:53:24476 for (j = 0; j < sce->ics.swb_sizes[i]; j++)
477 swb_coeffs[j] *= sce->ics.clip_avoidance_factor;
478 start += sce->ics.swb_sizes[i];
479 }
480 }
481 }
482}
483
484/**
Alex Converse78e65cd2009-07-08 20:01:31485 * Encode one channel of audio data.
486 */
Diego Biurrun99d61d32009-07-08 21:16:06487static int encode_individual_channel(AVCodecContext *avctx, AACEncContext *s,
488 SingleChannelElement *sce,
489 int common_window)
Alex Converse78e65cd2009-07-08 20:01:31490{
491 put_bits(&s->pb, 8, sce->sf_idx[0]);
Rostislav Pehlivanov76b81b12015-08-21 18:38:05492 if (!common_window) {
Diego Biurrun99d61d32009-07-08 21:16:06493 put_ics_info(s, &sce->ics);
Rostislav Pehlivanov76b81b12015-08-21 18:38:05494 if (s->coder->encode_main_pred)
495 s->coder->encode_main_pred(s, sce);
Rostislav Pehlivanov27d23ae2015-10-17 01:22:51496 if (s->coder->encode_ltp_info)
497 s->coder->encode_ltp_info(s, sce, 0);
Rostislav Pehlivanov76b81b12015-08-21 18:38:05498 }
Alex Converse78e65cd2009-07-08 20:01:31499 encode_band_info(s, sce);
500 encode_scale_factors(avctx, s, sce);
501 encode_pulses(s, &sce->pulse);
Rostislav Pehlivanovf20b6712015-08-29 05:47:31502 put_bits(&s->pb, 1, !!sce->tns.present);
Rostislav Pehlivanova1c487e2015-08-21 18:27:38503 if (s->coder->encode_tns_info)
504 s->coder->encode_tns_info(s, sce);
Alex Converse78e65cd2009-07-08 20:01:31505 put_bits(&s->pb, 1, 0); //ssr
506 encode_spectral_coeffs(s, sce);
507 return 0;
508}
509
510/**
Kostya Shishkovc03d9d02008-08-14 05:52:29511 * Write some auxiliary information about the created AAC file.
512 */
Diego Biurrun72c758f2012-10-24 17:16:08513static void put_bitstream_info(AACEncContext *s, const char *name)
Kostya Shishkovc03d9d02008-08-14 05:52:29514{
515 int i, namelen, padbits;
516
517 namelen = strlen(name) + 2;
Kostya Shishkovf5c3eae2008-08-16 11:59:36518 put_bits(&s->pb, 3, TYPE_FIL);
Kostya Shishkovc03d9d02008-08-14 05:52:29519 put_bits(&s->pb, 4, FFMIN(namelen, 15));
Alex Conversefd257dc2009-07-08 20:36:45520 if (namelen >= 15)
Michael Niedermayer018a6642012-01-22 00:40:10521 put_bits(&s->pb, 8, namelen - 14);
Kostya Shishkovc03d9d02008-08-14 05:52:29522 put_bits(&s->pb, 4, 0); //extension type - filler
Alex Converseefe68072012-01-23 21:08:32523 padbits = -put_bits_count(&s->pb) & 7;
Anton Khirnov717503f2020-10-26 12:36:06524 align_put_bits(&s->pb);
Alex Conversefd257dc2009-07-08 20:36:45525 for (i = 0; i < namelen - 2; i++)
Kostya Shishkovc03d9d02008-08-14 05:52:29526 put_bits(&s->pb, 8, name[i]);
527 put_bits(&s->pb, 12 - padbits, 0);
528}
529
Nathan Caldwell9b8e2a82011-12-15 02:43:56530/*
Justin Rugglesf3e2d682012-08-25 17:04:33531 * Copy input samples.
Michael Niedermayer4b4d3d72012-02-01 02:46:11532 * Channels are reordered from libavcodec's default order to AAC order.
Nathan Caldwell9b8e2a82011-12-15 02:43:56533 */
Justin Rugglesf3e2d682012-08-25 17:04:33534static void copy_input_samples(AACEncContext *s, const AVFrame *frame)
Nathan Caldwell9b8e2a82011-12-15 02:43:56535{
Justin Rugglesf3e2d682012-08-25 17:04:33536 int ch;
537 int end = 2048 + (frame ? frame->nb_samples : 0);
Rostislav Pehlivanovfbf295e2016-10-03 18:53:11538 const uint8_t *channel_map = s->reorder_map;
Nathan Caldwell9b8e2a82011-12-15 02:43:56539
Justin Rugglesf3e2d682012-08-25 17:04:33540 /* copy and remap input samples */
541 for (ch = 0; ch < s->channels; ch++) {
Nathan Caldwell9b8e2a82011-12-15 02:43:56542 /* copy last 1024 samples of previous frame to the start of the current frame */
Nathan Caldwelldc7e7d42012-01-28 05:23:40543 memcpy(&s->planar_samples[ch][1024], &s->planar_samples[ch][2048], 1024 * sizeof(s->planar_samples[0][0]));
Nathan Caldwell9b8e2a82011-12-15 02:43:56544
Justin Rugglesf3e2d682012-08-25 17:04:33545 /* copy new samples and zero any remaining samples */
Justin Rugglesad953072012-01-28 17:28:01546 if (frame) {
Justin Rugglesf3e2d682012-08-25 17:04:33547 memcpy(&s->planar_samples[ch][2048],
548 frame->extended_data[channel_map[ch]],
549 frame->nb_samples * sizeof(s->planar_samples[0][0]));
Nathan Caldwell9b8e2a82011-12-15 02:43:56550 }
Justin Rugglesf3e2d682012-08-25 17:04:33551 memset(&s->planar_samples[ch][end], 0,
552 (3072 - end) * sizeof(s->planar_samples[0][0]));
Nathan Caldwell9b8e2a82011-12-15 02:43:56553 }
554}
555
Justin Rugglesad953072012-01-28 17:28:01556static int aac_encode_frame(AVCodecContext *avctx, AVPacket *avpkt,
557 const AVFrame *frame, int *got_packet_ptr)
Alex Converse78e65cd2009-07-08 20:01:31558{
559 AACEncContext *s = avctx->priv_data;
Nathan Caldwell7946a5a2011-12-24 22:24:16560 float **samples = s->planar_samples, *samples2, *la, *overlap;
Alex Converse78e65cd2009-07-08 20:01:31561 ChannelElement *cpe;
Rostislav Pehlivanovd1ca7142015-08-21 18:13:26562 SingleChannelElement *sce;
Rostislav Pehlivanov2d9b5ae2015-10-17 01:13:00563 IndividualChannelStream *ics;
Claudio Freire7ec74ae2015-09-23 05:13:56564 int i, its, ch, w, chans, tag, start_ch, ret, frame_bits;
Claudio Freire01ecb712015-10-11 20:29:50565 int target_bits, rate_bits, too_many_bits, too_few_bits;
Rostislav Pehlivanovd1ca7142015-08-21 18:13:26566 int ms_mode = 0, is_mode = 0, tns_mode = 0, pred_mode = 0;
Alex Converse78e65cd2009-07-08 20:01:31567 int chan_el_counter[4];
Måns Rullgård86e41bc32010-07-06 00:06:15568 FFPsyWindowInfo windows[AAC_MAX_CHANNELS];
Alex Converse78e65cd2009-07-08 20:01:31569
Justin Rugglesad953072012-01-28 17:28:01570 /* add current frame to queue */
571 if (frame) {
Michael Niedermayer98fed592013-01-13 23:02:50572 if ((ret = ff_af_queue_add(&s->afq, frame)) < 0)
Justin Rugglesad953072012-01-28 17:28:01573 return ret;
Rostislav Pehlivanov0cf68532016-11-07 02:11:50574 } else {
575 if (!s->afq.remaining_samples || (!s->afq.frame_alloc && !s->afq.frame_count))
576 return 0;
Justin Rugglesad953072012-01-28 17:28:01577 }
578
Justin Rugglesf3e2d682012-08-25 17:04:33579 copy_input_samples(s, frame);
Justin Ruggles89eea6d2012-01-28 22:51:22580 if (s->psypp)
581 ff_psy_preprocess(s->psypp, s->planar_samples, s->channels);
Nathan Caldwell9b8e2a82011-12-15 02:43:56582
583 if (!avctx->frame_number)
Alex Converse78e65cd2009-07-08 20:01:31584 return 0;
Alex Converse78e65cd2009-07-08 20:01:31585
Alex Converse78e65cd2009-07-08 20:01:31586 start_ch = 0;
Nathan Caldwell1bb52042011-06-20 04:29:37587 for (i = 0; i < s->chan_map[0]; i++) {
Alex Converse5962f6b2009-07-08 23:10:13588 FFPsyWindowInfo* wi = windows + start_ch;
Nathan Caldwell1bb52042011-06-20 04:29:37589 tag = s->chan_map[i+1];
Diego Biurrun99d61d32009-07-08 21:16:06590 chans = tag == TYPE_CPE ? 2 : 1;
591 cpe = &s->cpe[i];
Nathan Caldwell5b29af62011-05-06 07:19:51592 for (ch = 0; ch < chans; ch++) {
Michael Niedermayer2cb8ede2016-01-20 14:05:38593 int k;
Michael Niedermayerc38a6072015-10-17 11:40:04594 float clip_avoidance_factor;
Rostislav Pehlivanov2d9b5ae2015-10-17 01:13:00595 sce = &cpe->ch[ch];
596 ics = &sce->ics;
597 s->cur_channel = start_ch + ch;
Rostislav Pehlivanov2d9b5ae2015-10-17 01:13:00598 overlap = &samples[s->cur_channel][0];
Nathan Caldwell7946a5a2011-12-24 22:24:16599 samples2 = overlap + 1024;
Nathan Caldwell9b8e2a82011-12-15 02:43:56600 la = samples2 + (448+64);
Justin Rugglesad953072012-01-28 17:28:01601 if (!frame)
Nathan Caldwell2bb1d0e2010-07-19 18:22:44602 la = NULL;
Alex Converse03d5d9b2010-07-07 21:48:51603 if (tag == TYPE_LFE) {
Claudio Freire8005b6d2016-04-06 02:13:44604 wi[ch].window_type[0] = wi[ch].window_type[1] = ONLY_LONG_SEQUENCE;
Nathan Caldwell5b29af62011-05-06 07:19:51605 wi[ch].window_shape = 0;
606 wi[ch].num_windows = 1;
607 wi[ch].grouping[0] = 1;
Claudio Freire8005b6d2016-04-06 02:13:44608 wi[ch].clipping[0] = 0;
Nathan Caldwell24efdea2011-07-29 20:49:04609
610 /* Only the lowest 12 coefficients are used in a LFE channel.
611 * The expression below results in only the bottom 8 coefficients
612 * being used for 11.025kHz to 16kHz sample rates.
613 */
614 ics->num_swb = s->samplerate_index >= 8 ? 1 : 3;
Alex Converse03d5d9b2010-07-07 21:48:51615 } else {
Rostislav Pehlivanov2d9b5ae2015-10-17 01:13:00616 wi[ch] = s->psy.model->window(&s->psy, samples2, la, s->cur_channel,
Alex Converse26784382010-07-07 21:50:50617 ics->window_sequence[0]);
Alex Converse03d5d9b2010-07-07 21:48:51618 }
Alex Converse78e65cd2009-07-08 20:01:31619 ics->window_sequence[1] = ics->window_sequence[0];
Nathan Caldwell5b29af62011-05-06 07:19:51620 ics->window_sequence[0] = wi[ch].window_type[0];
Alex Converse78e65cd2009-07-08 20:01:31621 ics->use_kb_window[1] = ics->use_kb_window[0];
Nathan Caldwell5b29af62011-05-06 07:19:51622 ics->use_kb_window[0] = wi[ch].window_shape;
623 ics->num_windows = wi[ch].num_windows;
Alex Converse78e65cd2009-07-08 20:01:31624 ics->swb_sizes = s->psy.bands [ics->num_windows == 8];
Nathan Caldwell24efdea2011-07-29 20:49:04625 ics->num_swb = tag == TYPE_LFE ? ics->num_swb : s->psy.num_bands[ics->num_windows == 8];
Andreas Cadhalpun5b0da692015-12-06 20:35:08626 ics->max_sfb = FFMIN(ics->max_sfb, ics->num_swb);
Rostislav Pehlivanov23e786b2015-08-21 17:40:44627 ics->swb_offset = wi[ch].window_type[0] == EIGHT_SHORT_SEQUENCE ?
628 ff_swb_offset_128 [s->samplerate_index]:
629 ff_swb_offset_1024[s->samplerate_index];
Rostislav Pehlivanov5ed5ca72015-09-01 05:20:24630 ics->tns_max_bands = wi[ch].window_type[0] == EIGHT_SHORT_SEQUENCE ?
631 ff_tns_max_bands_128 [s->samplerate_index]:
632 ff_tns_max_bands_1024[s->samplerate_index];
Claudio Freire8005b6d2016-04-06 02:13:44633
Nathan Caldwell5b29af62011-05-06 07:19:51634 for (w = 0; w < ics->num_windows; w++)
635 ics->group_len[w] = wi[ch].grouping[w];
Claudio Freire8005b6d2016-04-06 02:13:44636
637 /* Calculate input sample maximums and evaluate clipping risk */
638 clip_avoidance_factor = 0.0f;
639 for (w = 0; w < ics->num_windows; w++) {
640 const float *wbuf = overlap + w * 128;
641 const int wlen = 2048 / ics->num_windows;
642 float max = 0;
643 int j;
644 /* mdct input is 2 * output */
645 for (j = 0; j < wlen; j++)
646 max = FFMAX(max, fabsf(wbuf[j]));
647 wi[ch].clipping[w] = max;
648 }
Claudio Freire59216e02015-07-21 01:53:24649 for (w = 0; w < ics->num_windows; w++) {
650 if (wi[ch].clipping[w] > CLIP_AVOIDANCE_FACTOR) {
651 ics->window_clipping[w] = 1;
652 clip_avoidance_factor = FFMAX(clip_avoidance_factor, wi[ch].clipping[w]);
653 } else {
654 ics->window_clipping[w] = 0;
655 }
656 }
657 if (clip_avoidance_factor > CLIP_AVOIDANCE_FACTOR) {
658 ics->clip_avoidance_factor = CLIP_AVOIDANCE_FACTOR / clip_avoidance_factor;
659 } else {
660 ics->clip_avoidance_factor = 1.0f;
661 }
Alex Converse78e65cd2009-07-08 20:01:31662
Rostislav Pehlivanov2d9b5ae2015-10-17 01:13:00663 apply_window_and_mdct(s, sce, overlap);
Rostislav Pehlivanov27d23ae2015-10-17 01:22:51664
665 if (s->options.ltp && s->coder->update_ltp) {
666 s->coder->update_ltp(s, sce);
667 apply_window[sce->ics.window_sequence[0]](s->fdsp, sce, &sce->ltp_state[0]);
668 s->mdct1024.mdct_calc(&s->mdct1024, sce->lcoeffs, sce->ret_buf);
669 }
670
Michael Niedermayer2cb8ede2016-01-20 14:05:38671 for (k = 0; k < 1024; k++) {
Michael Niedermayer77bf96b2016-08-23 09:00:29672 if (!(fabs(cpe->ch[ch].coeffs[k]) < 1E16)) { // Ensure headroom for energy calculation
673 av_log(avctx, AV_LOG_ERROR, "Input contains (near) NaN/+-Inf\n");
Michael Niedermayer2cb8ede2016-01-20 14:05:38674 return AVERROR(EINVAL);
675 }
Michael Niedermayerf9fa5602014-11-08 22:32:39676 }
Rostislav Pehlivanov2d9b5ae2015-10-17 01:13:00677 avoid_clipping(s, sce);
Alex Converse5962f6b2009-07-08 23:10:13678 }
679 start_ch += chans;
680 }
Andreas Rheinhardt56e9e022021-05-11 13:17:13681 if ((ret = ff_alloc_packet(avctx, avpkt, 8192 * s->channels)) < 0)
Reimar Döffingerecd74552012-04-06 13:25:05682 return ret;
Claudio Freire7ec74ae2015-09-23 05:13:56683 frame_bits = its = 0;
Alex Converse48d20c12009-07-08 23:12:53684 do {
Justin Rugglesad953072012-01-28 17:28:01685 init_put_bits(&s->pb, avpkt->data, avpkt->size);
686
Vittorio Giovara7c6eb0a2015-06-29 19:59:37687 if ((avctx->frame_number & 0xFF)==1 && !(avctx->flags & AV_CODEC_FLAG_BITEXACT))
Diego Biurrun72c758f2012-10-24 17:16:08688 put_bitstream_info(s, LIBAVCODEC_IDENT);
Alex Conversef11bfe32009-07-08 23:14:47689 start_ch = 0;
Claudio Freire7ec74ae2015-09-23 05:13:56690 target_bits = 0;
Alex Conversef11bfe32009-07-08 23:14:47691 memset(chan_el_counter, 0, sizeof(chan_el_counter));
Nathan Caldwell1bb52042011-06-20 04:29:37692 for (i = 0; i < s->chan_map[0]; i++) {
Alex Conversef11bfe32009-07-08 23:14:47693 FFPsyWindowInfo* wi = windows + start_ch;
Nathan Caldwell01344fe2011-05-19 05:14:59694 const float *coeffs[2];
Nathan Caldwell1bb52042011-06-20 04:29:37695 tag = s->chan_map[i+1];
Alex Conversef11bfe32009-07-08 23:14:47696 chans = tag == TYPE_CPE ? 2 : 1;
697 cpe = &s->cpe[i];
Rostislav Pehlivanova0079aa2015-09-01 06:00:10698 cpe->common_window = 0;
Rostislav Pehlivanov9f4f5782015-07-02 18:13:03699 memset(cpe->is_mask, 0, sizeof(cpe->is_mask));
700 memset(cpe->ms_mask, 0, sizeof(cpe->ms_mask));
Alex Converse8e4c11e2010-08-30 23:52:03701 put_bits(&s->pb, 3, tag);
702 put_bits(&s->pb, 4, chan_el_counter[tag]++);
Rostislav Pehlivanove6c9f3a2015-08-21 17:36:09703 for (ch = 0; ch < chans; ch++) {
704 sce = &cpe->ch[ch];
705 coeffs[ch] = sce->coeffs;
Rostislav Pehlivanov76b81b12015-08-21 18:38:05706 sce->ics.predictor_present = 0;
Rostislav Pehlivanov27d23ae2015-10-17 01:22:51707 sce->ics.ltp.present = 0;
708 memset(sce->ics.ltp.used, 0, sizeof(sce->ics.ltp.used));
Rostislav Pehlivanov3f3be1c2015-10-17 01:14:10709 memset(sce->ics.prediction_used, 0, sizeof(sce->ics.prediction_used));
Rostislav Pehlivanova1c487e2015-08-21 18:27:38710 memset(&sce->tns, 0, sizeof(TemporalNoiseShaping));
Rostislav Pehlivanove6c9f3a2015-08-21 17:36:09711 for (w = 0; w < 128; w++)
712 if (sce->band_type[w] > RESERVED_BT)
713 sce->band_type[w] = 0;
714 }
Claudio Freire7ec74ae2015-09-23 05:13:56715 s->psy.bitres.alloc = -1;
Rostislav Pehlivanov4386f172015-12-18 14:27:13716 s->psy.bitres.bits = s->last_frame_pb_count / s->channels;
Nathan Caldwelld3a6c2a2011-05-19 05:23:22717 s->psy.model->analyze(&s->psy, start_ch, coeffs, wi);
Claudio Freire7ec74ae2015-09-23 05:13:56718 if (s->psy.bitres.alloc > 0) {
719 /* Lambda unused here on purpose, we need to take psy's unscaled allocation */
Claudio Freire01ecb712015-10-11 20:29:50720 target_bits += s->psy.bitres.alloc
721 * (s->lambda / (avctx->global_quality ? avctx->global_quality : 120));
Claudio Freire7ec74ae2015-09-23 05:13:56722 s->psy.bitres.alloc /= chans;
723 }
724 s->cur_type = tag;
Nathan Caldwell5b29af62011-05-06 07:19:51725 for (ch = 0; ch < chans; ch++) {
Claudio Freiree41cd3c2013-05-12 07:38:40726 s->cur_channel = start_ch + ch;
Claudio Freire01ecb712015-10-11 20:29:50727 if (s->options.pns && s->coder->mark_pns)
728 s->coder->mark_pns(s, avctx, &cpe->ch[ch]);
Nathan Caldwell5b29af62011-05-06 07:19:51729 s->coder->search_for_quantizers(avctx, s, &cpe->ch[ch], s->lambda);
Alex Conversef11bfe32009-07-08 23:14:47730 }
Alex Conversef11bfe32009-07-08 23:14:47731 if (chans > 1
732 && wi[0].window_type[0] == wi[1].window_type[0]
733 && wi[0].window_shape == wi[1].window_shape) {
Alex Converse78e65cd2009-07-08 20:01:31734
Alex Conversef11bfe32009-07-08 23:14:47735 cpe->common_window = 1;
Nathan Caldwell5b29af62011-05-06 07:19:51736 for (w = 0; w < wi[0].num_windows; w++) {
737 if (wi[0].grouping[w] != wi[1].grouping[w]) {
Alex Conversef11bfe32009-07-08 23:14:47738 cpe->common_window = 0;
739 break;
740 }
Alex Converse78e65cd2009-07-08 20:01:31741 }
742 }
Rostislav Pehlivanov20dc5272015-09-02 05:26:45743 for (ch = 0; ch < chans; ch++) { /* TNS and PNS */
Rostislav Pehlivanova1c487e2015-08-21 18:27:38744 sce = &cpe->ch[ch];
745 s->cur_channel = start_ch + ch;
Rostislav Pehlivanova1c487e2015-08-21 18:27:38746 if (s->options.tns && s->coder->search_for_tns)
747 s->coder->search_for_tns(s, sce);
Rostislav Pehlivanovf20b6712015-08-29 05:47:31748 if (s->options.tns && s->coder->apply_tns_filt)
Rostislav Pehlivanovf3f6c6b2015-09-01 05:44:07749 s->coder->apply_tns_filt(s, sce);
Rostislav Pehlivanova1c487e2015-08-21 18:27:38750 if (sce->tns.present)
751 tns_mode = 1;
Rostislav Pehlivanovb32e9892015-12-06 13:32:40752 if (s->options.pns && s->coder->search_for_pns)
753 s->coder->search_for_pns(s, avctx, sce);
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05754 }
Claudio Freiree41cd3c2013-05-12 07:38:40755 s->cur_channel = start_ch;
Rostislav Pehlivanov20dc5272015-09-02 05:26:45756 if (s->options.intensity_stereo) { /* Intensity Stereo */
757 if (s->coder->search_for_is)
758 s->coder->search_for_is(s, avctx, cpe);
Rostislav Pehlivanove8576dc2015-07-02 18:13:07759 if (cpe->is_mode) is_mode = 1;
Rostislav Pehlivanov20dc5272015-09-02 05:26:45760 apply_intensity_stereo(cpe);
Rostislav Pehlivanove8576dc2015-07-02 18:13:07761 }
Rostislav Pehlivanov20dc5272015-09-02 05:26:45762 if (s->options.pred) { /* Prediction */
763 for (ch = 0; ch < chans; ch++) {
764 sce = &cpe->ch[ch];
765 s->cur_channel = start_ch + ch;
766 if (s->options.pred && s->coder->search_for_pred)
767 s->coder->search_for_pred(s, sce);
768 if (cpe->ch[ch].ics.predictor_present) pred_mode = 1;
769 }
Rostislav Pehlivanov93e6b232015-10-12 22:33:07770 if (s->coder->adjust_common_pred)
771 s->coder->adjust_common_pred(s, cpe);
Rostislav Pehlivanov20dc5272015-09-02 05:26:45772 for (ch = 0; ch < chans; ch++) {
773 sce = &cpe->ch[ch];
774 s->cur_channel = start_ch + ch;
775 if (s->options.pred && s->coder->apply_main_pred)
776 s->coder->apply_main_pred(s, sce);
777 }
778 s->cur_channel = start_ch;
779 }
Rostislav Pehlivanov0f4334d2015-10-12 15:50:10780 if (s->options.mid_side) { /* Mid/Side stereo */
781 if (s->options.mid_side == -1 && s->coder->search_for_ms)
Rostislav Pehlivanov20dc5272015-09-02 05:26:45782 s->coder->search_for_ms(s, cpe);
783 else if (cpe->common_window)
784 memset(cpe->ms_mask, 1, sizeof(cpe->ms_mask));
Rostislav Pehlivanov20dc5272015-09-02 05:26:45785 apply_mid_side_stereo(cpe);
786 }
Diego Biurrun72c758f2012-10-24 17:16:08787 adjust_frame_information(cpe, chans);
Rostislav Pehlivanov27d23ae2015-10-17 01:22:51788 if (s->options.ltp) { /* LTP */
789 for (ch = 0; ch < chans; ch++) {
790 sce = &cpe->ch[ch];
791 s->cur_channel = start_ch + ch;
792 if (s->coder->search_for_ltp)
793 s->coder->search_for_ltp(s, sce, cpe->common_window);
794 if (sce->ics.ltp.present) pred_mode = 1;
795 }
796 s->cur_channel = start_ch;
797 if (s->coder->adjust_common_ltp)
798 s->coder->adjust_common_ltp(s, cpe);
799 }
Alex Conversef11bfe32009-07-08 23:14:47800 if (chans == 2) {
801 put_bits(&s->pb, 1, cpe->common_window);
802 if (cpe->common_window) {
803 put_ics_info(s, &cpe->ch[0].ics);
Rostislav Pehlivanov76b81b12015-08-21 18:38:05804 if (s->coder->encode_main_pred)
805 s->coder->encode_main_pred(s, &cpe->ch[0]);
Rostislav Pehlivanov27d23ae2015-10-17 01:22:51806 if (s->coder->encode_ltp_info)
807 s->coder->encode_ltp_info(s, &cpe->ch[0], 1);
Alex Conversef11bfe32009-07-08 23:14:47808 encode_ms_info(&s->pb, cpe);
Claudio Freire6394aca2015-03-03 06:43:06809 if (cpe->ms_mode) ms_mode = 1;
Alex Conversef11bfe32009-07-08 23:14:47810 }
Alex Converse78e65cd2009-07-08 20:01:31811 }
Nathan Caldwell5b29af62011-05-06 07:19:51812 for (ch = 0; ch < chans; ch++) {
813 s->cur_channel = start_ch + ch;
814 encode_individual_channel(avctx, s, &cpe->ch[ch], cpe->common_window);
Alex Conversef11bfe32009-07-08 23:14:47815 }
816 start_ch += chans;
Alex Converse78e65cd2009-07-08 20:01:31817 }
Alex Converse78e65cd2009-07-08 20:01:31818
James Almerf5c8d002017-03-26 00:35:15819 if (avctx->flags & AV_CODEC_FLAG_QSCALE) {
Claudio Freire7ec74ae2015-09-23 05:13:56820 /* When using a constant Q-scale, don't mess with lambda */
Alex Converse48d20c12009-07-08 23:12:53821 break;
Nathan Caldwell230c1a92011-01-05 08:32:16822 }
Claudio Freire7ec74ae2015-09-23 05:13:56823
824 /* rate control stuff
Claudio Freire01ecb712015-10-11 20:29:50825 * allow between the nominal bitrate, and what psy's bit reservoir says to target
826 * but drift towards the nominal bitrate always
Claudio Freire7ec74ae2015-09-23 05:13:56827 */
Claudio Freire7ec74ae2015-09-23 05:13:56828 frame_bits = put_bits_count(&s->pb);
Claudio Freire01ecb712015-10-11 20:29:50829 rate_bits = avctx->bit_rate * 1024 / avctx->sample_rate;
830 rate_bits = FFMIN(rate_bits, 6144 * s->channels - 3);
831 too_many_bits = FFMAX(target_bits, rate_bits);
832 too_many_bits = FFMIN(too_many_bits, 6144 * s->channels - 3);
833 too_few_bits = FFMIN(FFMAX(rate_bits - rate_bits/4, target_bits), too_many_bits);
Claudio Freire7ec74ae2015-09-23 05:13:56834
835 /* When using ABR, be strict (but only for increasing) */
Claudio Freire01ecb712015-10-11 20:29:50836 too_few_bits = too_few_bits - too_few_bits/8;
837 too_many_bits = too_many_bits + too_many_bits/2;
Claudio Freire7ec74ae2015-09-23 05:13:56838
839 if ( its == 0 /* for steady-state Q-scale tracking */
840 || (its < 5 && (frame_bits < too_few_bits || frame_bits > too_many_bits))
841 || frame_bits >= 6144 * s->channels - 3 )
842 {
Claudio Freire01ecb712015-10-11 20:29:50843 float ratio = ((float)rate_bits) / frame_bits;
Claudio Freire7ec74ae2015-09-23 05:13:56844
845 if (frame_bits >= too_few_bits && frame_bits <= too_many_bits) {
846 /*
847 * This path is for steady-state Q-scale tracking
848 * When frame bits fall within the stable range, we still need to adjust
849 * lambda to maintain it like so in a stable fashion (large jumps in lambda
850 * create artifacts and should be avoided), but slowly
851 */
852 ratio = sqrtf(sqrtf(ratio));
853 ratio = av_clipf(ratio, 0.9f, 1.1f);
854 } else {
855 /* Not so fast though */
856 ratio = sqrtf(ratio);
Claudio Freire6394aca2015-03-03 06:43:06857 }
Michael Niedermayer4b89cf72021-06-01 08:07:05858 s->lambda = av_clipf(s->lambda * ratio, FLT_EPSILON, 65536.f);
Claudio Freire7ec74ae2015-09-23 05:13:56859
860 /* Keep iterating if we must reduce and lambda is in the sky */
Claudio Freireca203e92015-12-01 06:28:36861 if (ratio > 0.9f && ratio < 1.1f) {
Claudio Freire7ec74ae2015-09-23 05:13:56862 break;
863 } else {
864 if (is_mode || ms_mode || tns_mode || pred_mode) {
865 for (i = 0; i < s->chan_map[0]; i++) {
866 // Must restore coeffs
867 chans = tag == TYPE_CPE ? 2 : 1;
868 cpe = &s->cpe[i];
869 for (ch = 0; ch < chans; ch++)
870 memcpy(cpe->ch[ch].coeffs, cpe->ch[ch].pcoeffs, sizeof(cpe->ch[ch].coeffs));
871 }
872 }
873 its++;
874 }
875 } else {
876 break;
Claudio Freire6394aca2015-03-03 06:43:06877 }
Alex Converse48d20c12009-07-08 23:12:53878 } while (1);
879
Rostislav Pehlivanov27d23ae2015-10-17 01:22:51880 if (s->options.ltp && s->coder->ltp_insert_new_frame)
881 s->coder->ltp_insert_new_frame(s);
882
Alex Converse78e65cd2009-07-08 20:01:31883 put_bits(&s->pb, 3, TYPE_END);
884 flush_put_bits(&s->pb);
Hendrik Leppkes362028c2015-12-18 13:39:15885
Rostislav Pehlivanov4386f172015-12-18 14:27:13886 s->last_frame_pb_count = put_bits_count(&s->pb);
Andreas Rheinhardtc81b8e02021-03-25 11:52:56887 avpkt->size = put_bytes_output(&s->pb);
Alex Converse78e65cd2009-07-08 20:01:31888
Claudio Freire01ecb712015-10-11 20:29:50889 s->lambda_sum += s->lambda;
890 s->lambda_count++;
Alex Converse78e65cd2009-07-08 20:01:31891
Justin Rugglesad953072012-01-28 17:28:01892 ff_af_queue_remove(&s->afq, avctx->frame_size, &avpkt->pts,
893 &avpkt->duration);
894
Justin Rugglesad953072012-01-28 17:28:01895 *got_packet_ptr = 1;
896 return 0;
Alex Converse78e65cd2009-07-08 20:01:31897}
898
Kostya Shishkovc03d9d02008-08-14 05:52:29899static av_cold int aac_encode_end(AVCodecContext *avctx)
900{
901 AACEncContext *s = avctx->priv_data;
902
Michael Niedermayerc520b982021-05-29 15:49:22903 av_log(avctx, AV_LOG_INFO, "Qavg: %.3f\n", s->lambda_count ? s->lambda_sum / s->lambda_count : NAN);
Claudio Freire01ecb712015-10-11 20:29:50904
Kostya Shishkovc03d9d02008-08-14 05:52:29905 ff_mdct_end(&s->mdct1024);
906 ff_mdct_end(&s->mdct128);
Alex Converse78e65cd2009-07-08 20:01:31907 ff_psy_end(&s->psy);
Rostislav Pehlivanovb47a1e52015-08-21 17:43:09908 ff_lpc_end(&s->lpc);
Nathan Caldwell53107042011-12-15 02:50:23909 if (s->psypp)
910 ff_psy_preprocess_end(s->psypp);
Nathan Caldwell9b8e2a82011-12-15 02:43:56911 av_freep(&s->buffer.samples);
Kostya Shishkovc03d9d02008-08-14 05:52:29912 av_freep(&s->cpe);
Michael Niedermayer14285c32014-11-29 17:58:13913 av_freep(&s->fdsp);
Justin Rugglesad953072012-01-28 17:28:01914 ff_af_queue_close(&s->afq);
Kostya Shishkovc03d9d02008-08-14 05:52:29915 return 0;
916}
917
Nathan Caldwell53107042011-12-15 02:50:23918static av_cold int dsp_init(AVCodecContext *avctx, AACEncContext *s)
919{
920 int ret = 0;
921
Michael Niedermayer94d68a42015-07-27 19:14:31922 s->fdsp = avpriv_float_dsp_alloc(avctx->flags & AV_CODEC_FLAG_BITEXACT);
Michael Niedermayer14285c32014-11-29 17:58:13923 if (!s->fdsp)
924 return AVERROR(ENOMEM);
Nathan Caldwell53107042011-12-15 02:50:23925
926 // window init
Andreas Rheinhardt86b8c252020-11-22 22:33:03927 ff_aac_float_common_init();
Nathan Caldwell53107042011-12-15 02:50:23928
Michael Niedermayer3fb726c2015-05-16 17:07:31929 if ((ret = ff_mdct_init(&s->mdct1024, 11, 0, 32768.0)) < 0)
Nathan Caldwell53107042011-12-15 02:50:23930 return ret;
Michael Niedermayer3fb726c2015-05-16 17:07:31931 if ((ret = ff_mdct_init(&s->mdct128, 8, 0, 32768.0)) < 0)
Nathan Caldwell53107042011-12-15 02:50:23932 return ret;
933
934 return 0;
935}
936
937static av_cold int alloc_buffers(AVCodecContext *avctx, AACEncContext *s)
938{
Mans Rullgard3715d8412012-01-29 20:55:10939 int ch;
Limin Wangebf2a8a2020-06-01 14:48:28940 if (!FF_ALLOCZ_TYPED_ARRAY(s->buffer.samples, s->channels * 3 * 1024) ||
941 !FF_ALLOCZ_TYPED_ARRAY(s->cpe, s->chan_map[0]))
942 return AVERROR(ENOMEM);
Nathan Caldwell53107042011-12-15 02:50:23943
Mans Rullgard3715d8412012-01-29 20:55:10944 for(ch = 0; ch < s->channels; ch++)
Nathan Caldwell7946a5a2011-12-24 22:24:16945 s->planar_samples[ch] = s->buffer.samples + 3 * 1024 * ch;
Nathan Caldwell9b8e2a82011-12-15 02:43:56946
Nathan Caldwell53107042011-12-15 02:50:23947 return 0;
Nathan Caldwell53107042011-12-15 02:50:23948}
949
950static av_cold int aac_encode_init(AVCodecContext *avctx)
951{
952 AACEncContext *s = avctx->priv_data;
953 int i, ret = 0;
954 const uint8_t *sizes[2];
955 uint8_t grouping[AAC_MAX_CHANNELS];
956 int lengths[2];
957
Rostislav Pehlivanovf0a82122016-02-12 18:34:18958 /* Constants */
Rostislav Pehlivanov4386f172015-12-18 14:27:13959 s->last_frame_pb_count = 0;
Nathan Caldwell53107042011-12-15 02:50:23960 avctx->frame_size = 1024;
Rostislav Pehlivanov0f4334d2015-10-12 15:50:10961 avctx->initial_padding = 1024;
Rostislav Pehlivanovf0a82122016-02-12 18:34:18962 s->lambda = avctx->global_quality > 0 ? avctx->global_quality : 120;
Nathan Caldwell53107042011-12-15 02:50:23963
Rostislav Pehlivanovf0a82122016-02-12 18:34:18964 /* Channel map and unspecified bitrate guessing */
965 s->channels = avctx->channels;
Rostislav Pehlivanovfbf295e2016-10-03 18:53:11966
967 s->needs_pce = 1;
968 for (i = 0; i < FF_ARRAY_ELEMS(aac_normal_chan_layouts); i++) {
969 if (avctx->channel_layout == aac_normal_chan_layouts[i]) {
970 s->needs_pce = s->options.pce;
971 break;
972 }
973 }
974
975 if (s->needs_pce) {
Moritz Barsnick1693a682018-07-06 21:49:50976 char buf[64];
Rostislav Pehlivanovfbf295e2016-10-03 18:53:11977 for (i = 0; i < FF_ARRAY_ELEMS(aac_pce_configs); i++)
978 if (avctx->channel_layout == aac_pce_configs[i].layout)
979 break;
Moritz Barsnick1693a682018-07-06 21:49:50980 av_get_channel_layout_string(buf, sizeof(buf), -1, avctx->channel_layout);
981 ERROR_IF(i == FF_ARRAY_ELEMS(aac_pce_configs), "Unsupported channel layout \"%s\"\n", buf);
982 av_log(avctx, AV_LOG_INFO, "Using a PCE to encode channel layout \"%s\"\n", buf);
Rostislav Pehlivanovfbf295e2016-10-03 18:53:11983 s->pce = aac_pce_configs[i];
984 s->reorder_map = s->pce.reorder_map;
985 s->chan_map = s->pce.config_map;
986 } else {
987 s->reorder_map = aac_chan_maps[s->channels - 1];
988 s->chan_map = aac_chan_configs[s->channels - 1];
989 }
990
Rostislav Pehlivanovf0a82122016-02-12 18:34:18991 if (!avctx->bit_rate) {
992 for (i = 1; i <= s->chan_map[0]; i++) {
993 avctx->bit_rate += s->chan_map[i] == TYPE_CPE ? 128000 : /* Pair */
994 s->chan_map[i] == TYPE_LFE ? 16000 : /* LFE */
995 69000 ; /* SCE */
996 }
997 }
998
999 /* Samplerate */
Nathan Caldwell53107042011-12-15 02:50:231000 for (i = 0; i < 16; i++)
Andreas Rheinhardt49bf9452021-02-10 18:37:371001 if (avctx->sample_rate == ff_mpeg4audio_sample_rates[i])
Nathan Caldwell53107042011-12-15 02:50:231002 break;
Rostislav Pehlivanov0f4334d2015-10-12 15:50:101003 s->samplerate_index = i;
Rostislav Pehlivanov0f4334d2015-10-12 15:50:101004 ERROR_IF(s->samplerate_index == 16 ||
1005 s->samplerate_index >= ff_aac_swb_size_1024_len ||
1006 s->samplerate_index >= ff_aac_swb_size_128_len,
Nathan Caldwell53107042011-12-15 02:50:231007 "Unsupported sample rate %d\n", avctx->sample_rate);
Rostislav Pehlivanovf0a82122016-02-12 18:34:181008
1009 /* Bitrate limiting */
Claudio Freire6dbbb982015-03-06 07:05:321010 WARN_IF(1024.0 * avctx->bit_rate / avctx->sample_rate > 6144 * s->channels,
Hendrik Leppkes92186f22015-12-08 08:59:451011 "Too many bits %f > %d per frame requested, clamping to max\n",
Luca Barbatob8054822015-11-28 11:28:211012 1024.0 * avctx->bit_rate / avctx->sample_rate,
1013 6144 * s->channels);
Rostislav Pehlivanovf0a82122016-02-12 18:34:181014 avctx->bit_rate = (int64_t)FFMIN(6144 * s->channels / 1024.0 * avctx->sample_rate,
1015 avctx->bit_rate);
Claudio Freire6dbbb982015-03-06 07:05:321016
Rostislav Pehlivanovf0a82122016-02-12 18:34:181017 /* Profile and option setting */
1018 avctx->profile = avctx->profile == FF_PROFILE_UNKNOWN ? FF_PROFILE_AAC_LOW :
1019 avctx->profile;
Rostislav Pehlivanove9299df2015-10-17 02:15:441020 for (i = 0; i < FF_ARRAY_ELEMS(aacenc_profiles); i++)
1021 if (avctx->profile == aacenc_profiles[i])
Rostislav Pehlivanov0f4334d2015-10-12 15:50:101022 break;
Rostislav Pehlivanove9299df2015-10-17 02:15:441023 if (avctx->profile == FF_PROFILE_MPEG2_AAC_LOW) {
1024 avctx->profile = FF_PROFILE_AAC_LOW;
1025 ERROR_IF(s->options.pred,
1026 "Main prediction unavailable in the \"mpeg2_aac_low\" profile\n");
1027 ERROR_IF(s->options.ltp,
1028 "LTP prediction unavailable in the \"mpeg2_aac_low\" profile\n");
1029 WARN_IF(s->options.pns,
1030 "PNS unavailable in the \"mpeg2_aac_low\" profile, turning off\n");
1031 s->options.pns = 0;
1032 } else if (avctx->profile == FF_PROFILE_AAC_LTP) {
1033 s->options.ltp = 1;
1034 ERROR_IF(s->options.pred,
1035 "Main prediction unavailable in the \"aac_ltp\" profile\n");
1036 } else if (avctx->profile == FF_PROFILE_AAC_MAIN) {
1037 s->options.pred = 1;
1038 ERROR_IF(s->options.ltp,
1039 "LTP prediction unavailable in the \"aac_main\" profile\n");
1040 } else if (s->options.ltp) {
1041 avctx->profile = FF_PROFILE_AAC_LTP;
1042 WARN_IF(1,
1043 "Chainging profile to \"aac_ltp\"\n");
1044 ERROR_IF(s->options.pred,
1045 "Main prediction unavailable in the \"aac_ltp\" profile\n");
1046 } else if (s->options.pred) {
1047 avctx->profile = FF_PROFILE_AAC_MAIN;
1048 WARN_IF(1,
1049 "Chainging profile to \"aac_main\"\n");
Rostislav Pehlivanov31125012015-12-05 18:43:171050 ERROR_IF(s->options.ltp,
Rostislav Pehlivanove9299df2015-10-17 02:15:441051 "LTP prediction unavailable in the \"aac_main\" profile\n");
Rostislav Pehlivanov0f4334d2015-10-12 15:50:101052 }
Rostislav Pehlivanove9299df2015-10-17 02:15:441053 s->profile = avctx->profile;
Rostislav Pehlivanov0f4334d2015-10-12 15:50:101054
Rostislav Pehlivanovf0a82122016-02-12 18:34:181055 /* Coder limitations */
1056 s->coder = &ff_aac_coders[s->options.coder];
Rostislav Pehlivanovfb0abb32016-08-06 23:49:341057 if (s->options.coder == AAC_CODER_ANMR) {
Rostislav Pehlivanovb270ec92015-12-05 14:41:411058 ERROR_IF(avctx->strict_std_compliance > FF_COMPLIANCE_EXPERIMENTAL,
Rostislav Pehlivanov6612d042016-08-13 16:34:581059 "The ANMR coder is considered experimental, add -strict -2 to enable!\n");
Rostislav Pehlivanov8ffe1cb2015-09-01 11:07:001060 s->options.intensity_stereo = 0;
1061 s->options.pns = 0;
1062 }
Rostislav Pehlivanova72b1ea2016-01-20 16:49:551063 ERROR_IF(s->options.ltp && avctx->strict_std_compliance > FF_COMPLIANCE_EXPERIMENTAL,
1064 "The LPT profile requires experimental compliance, add -strict -2 to enable!\n");
1065
Rostislav Pehlivanov0fe0e212016-02-13 12:23:221066 /* M/S introduces horrible artifacts with multichannel files, this is temporary */
1067 if (s->channels > 3)
1068 s->options.mid_side = 0;
1069
Vittorio Giovara971099f2014-12-17 13:53:431070 if ((ret = dsp_init(avctx, s)) < 0)
Limin Wangebf2a8a2020-06-01 14:48:281071 return ret;
Nathan Caldwell53107042011-12-15 02:50:231072
Vittorio Giovara971099f2014-12-17 13:53:431073 if ((ret = alloc_buffers(avctx, s)) < 0)
Limin Wangebf2a8a2020-06-01 14:48:281074 return ret;
Nathan Caldwell53107042011-12-15 02:50:231075
Rostislav Pehlivanov7b7775a2017-11-09 04:30:071076 if ((ret = put_audio_specific_config(avctx)))
Limin Wangebf2a8a2020-06-01 14:48:281077 return ret;
Nathan Caldwell53107042011-12-15 02:50:231078
Rostislav Pehlivanov0f4334d2015-10-12 15:50:101079 sizes[0] = ff_aac_swb_size_1024[s->samplerate_index];
1080 sizes[1] = ff_aac_swb_size_128[s->samplerate_index];
1081 lengths[0] = ff_aac_num_swb_1024[s->samplerate_index];
1082 lengths[1] = ff_aac_num_swb_128[s->samplerate_index];
Nathan Caldwell53107042011-12-15 02:50:231083 for (i = 0; i < s->chan_map[0]; i++)
1084 grouping[i] = s->chan_map[i + 1] == TYPE_CPE;
Vittorio Giovara971099f2014-12-17 13:53:431085 if ((ret = ff_psy_init(&s->psy, avctx, 2, sizes, lengths,
1086 s->chan_map[0], grouping)) < 0)
Limin Wangebf2a8a2020-06-01 14:48:281087 return ret;
Nathan Caldwell53107042011-12-15 02:50:231088 s->psypp = ff_psy_preprocess_init(avctx);
Rostislav Pehlivanovd09f9c42015-09-01 05:40:121089 ff_lpc_init(&s->lpc, 2*avctx->frame_size, TNS_MAX_ORDER, FF_LPC_TYPE_LEVINSON);
Rostislav Pehlivanov230178d2016-10-08 00:47:041090 s->random_state = 0x1f2e3d4c;
Nathan Caldwell53107042011-12-15 02:50:231091
Rostislav Pehlivanovd2ae5f72016-10-08 14:59:141092 s->abs_pow34 = abs_pow34_v;
1093 s->quant_bands = quantize_bands;
1094
1095 if (ARCH_X86)
1096 ff_aac_dsp_init_x86(s);
1097
Vicente Olivert Rieraa27401a2015-12-03 13:22:161098 if (HAVE_MIPSDSP)
Bojan Zivkovic26f39242013-03-06 13:55:051099 ff_aac_coder_init_mips(s);
1100
Justin Rugglesad953072012-01-28 17:28:011101 ff_af_queue_init(avctx, &s->afq);
Andreas Rheinhardt195d8ce2020-11-19 15:54:451102 ff_aac_tableinit();
Justin Rugglesad953072012-01-28 17:28:011103
Nathan Caldwell53107042011-12-15 02:50:231104 return 0;
Nathan Caldwell53107042011-12-15 02:50:231105}
1106
Nathan Caldwellcc9947f2011-06-01 05:38:091107#define AACENC_FLAGS AV_OPT_FLAG_ENCODING_PARAM | AV_OPT_FLAG_AUDIO_PARAM
1108static const AVOption aacenc_options[] = {
Lynne660d1d82021-05-21 15:39:361109 {"aac_coder", "Coding algorithm", offsetof(AACEncContext, options.coder), AV_OPT_TYPE_INT, {.i64 = AAC_CODER_TWOLOOP}, 0, AAC_CODER_NB-1, AACENC_FLAGS, "coder"},
Rostislav Pehlivanov0f4334d2015-10-12 15:50:101110 {"anmr", "ANMR method", 0, AV_OPT_TYPE_CONST, {.i64 = AAC_CODER_ANMR}, INT_MIN, INT_MAX, AACENC_FLAGS, "coder"},
1111 {"twoloop", "Two loop searching method", 0, AV_OPT_TYPE_CONST, {.i64 = AAC_CODER_TWOLOOP}, INT_MIN, INT_MAX, AACENC_FLAGS, "coder"},
Rostislav Pehlivanovfcb681a2018-01-13 11:46:291112 {"fast", "Default fast search", 0, AV_OPT_TYPE_CONST, {.i64 = AAC_CODER_FAST}, INT_MIN, INT_MAX, AACENC_FLAGS, "coder"},
Rostislav Pehlivanov83900c02015-10-17 01:20:131113 {"aac_ms", "Force M/S stereo coding", offsetof(AACEncContext, options.mid_side), AV_OPT_TYPE_BOOL, {.i64 = -1}, -1, 1, AACENC_FLAGS},
Rostislav Pehlivanove9299df2015-10-17 02:15:441114 {"aac_is", "Intensity stereo coding", offsetof(AACEncContext, options.intensity_stereo), AV_OPT_TYPE_BOOL, {.i64 = 1}, -1, 1, AACENC_FLAGS},
1115 {"aac_pns", "Perceptual noise substitution", offsetof(AACEncContext, options.pns), AV_OPT_TYPE_BOOL, {.i64 = 1}, -1, 1, AACENC_FLAGS},
Rostislav Pehlivanovdfba1be2015-10-17 10:06:051116 {"aac_tns", "Temporal noise shaping", offsetof(AACEncContext, options.tns), AV_OPT_TYPE_BOOL, {.i64 = 1}, -1, 1, AACENC_FLAGS},
Rostislav Pehlivanove9299df2015-10-17 02:15:441117 {"aac_ltp", "Long term prediction", offsetof(AACEncContext, options.ltp), AV_OPT_TYPE_BOOL, {.i64 = 0}, -1, 1, AACENC_FLAGS},
1118 {"aac_pred", "AAC-Main prediction", offsetof(AACEncContext, options.pred), AV_OPT_TYPE_BOOL, {.i64 = 0}, -1, 1, AACENC_FLAGS},
Rostislav Pehlivanovfbf295e2016-10-03 18:53:111119 {"aac_pce", "Forces the use of PCEs", offsetof(AACEncContext, options.pce), AV_OPT_TYPE_BOOL, {.i64 = 0}, -1, 1, AACENC_FLAGS},
Marton Balintaee036c2020-05-10 18:38:111120 FF_AAC_PROFILE_OPTS
Nathan Caldwellcc9947f2011-06-01 05:38:091121 {NULL}
1122};
1123
1124static const AVClass aacenc_class = {
Diego Biurrun97cfe1d2017-06-10 14:45:061125 .class_name = "AAC encoder",
1126 .item_name = av_default_item_name,
1127 .option = aacenc_options,
1128 .version = LIBAVUTIL_VERSION_INT,
Nathan Caldwellcc9947f2011-06-01 05:38:091129};
1130
Rostislav Pehlivanovf0a82122016-02-12 18:34:181131static const AVCodecDefault aac_encode_defaults[] = {
1132 { "b", "0" },
1133 { NULL }
1134};
1135
Andreas Rheinhardta247ac62021-02-25 09:50:261136const AVCodec ff_aac_encoder = {
Anton Khirnovec6402b2011-07-17 10:54:311137 .name = "aac",
Diego Biurrunb2bed932013-10-03 20:57:531138 .long_name = NULL_IF_CONFIG_SMALL("AAC (Advanced Audio Coding)"),
Anton Khirnovec6402b2011-07-17 10:54:311139 .type = AVMEDIA_TYPE_AUDIO,
Anton Khirnov36ef5362012-08-05 09:11:041140 .id = AV_CODEC_ID_AAC,
Anton Khirnovec6402b2011-07-17 10:54:311141 .priv_data_size = sizeof(AACEncContext),
1142 .init = aac_encode_init,
Justin Rugglesad953072012-01-28 17:28:011143 .encode2 = aac_encode_frame,
Anton Khirnovec6402b2011-07-17 10:54:311144 .close = aac_encode_end,
Rostislav Pehlivanovf0a82122016-02-12 18:34:181145 .defaults = aac_encode_defaults,
Andreas Rheinhardt49bf9452021-02-10 18:37:371146 .supported_samplerates = ff_mpeg4audio_sample_rates,
Limin Wang17e88bf2020-06-01 14:29:131147 .caps_internal = FF_CODEC_CAP_INIT_THREADSAFE | FF_CODEC_CAP_INIT_CLEANUP,
Rostislav Pehlivanovd9791a82015-12-05 14:45:181148 .capabilities = AV_CODEC_CAP_SMALL_LAST_FRAME | AV_CODEC_CAP_DELAY,
Justin Rugglesf3e2d682012-08-25 17:04:331149 .sample_fmts = (const enum AVSampleFormat[]){ AV_SAMPLE_FMT_FLTP,
Martin Storsjö00c3b672012-04-06 16:19:391150 AV_SAMPLE_FMT_NONE },
Martin Storsjö00c3b672012-04-06 16:19:391151 .priv_class = &aacenc_class,
Kostya Shishkovc03d9d02008-08-14 05:52:291152};