blob: 96915c973196a3cec350d1956a6d903d2a197924 [file] [log] [blame]
/*
 * AAC coefficients encoder
 * Copyright (C) 2008-2009 Konstantin Shishkov
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
21
/**
 * @file
 * AAC coefficients encoder
 */
26
/***********************************
 *              TODOs:
 * speed up quantizer selection
 * add sane pulse detection
 ***********************************/
32
Reinhard Tartler083e7152011-05-11 11:51:1133#include "libavutil/libm.h" // brought forward to work around cygwin header breakage
34
Alex Converse144c5e32010-05-25 18:28:1835#include <float.h>
Claudio Freire01ecb712015-10-11 20:29:5036
Mans Rullgard85770d62011-07-17 10:19:3537#include "libavutil/mathematics.h"
Claudio Freire01ecb712015-10-11 20:29:5038#include "mathops.h"
Alex Converse78e65cd2009-07-08 20:01:3139#include "avcodec.h"
40#include "put_bits.h"
41#include "aac.h"
42#include "aacenc.h"
43#include "aactab.h"
Rostislav Pehlivanovc47c7812015-07-29 04:44:2644#include "aacenctab.h"
Rostislav Pehlivanovef8e5a62015-07-29 04:44:2745#include "aacenc_utils.h"
Rostislav Pehlivanov43b378a2015-08-21 17:53:1446#include "aacenc_quantization.h"
Alex Converse78e65cd2009-07-08 20:01:3147
Rostislav Pehlivanovd1ca7142015-08-21 18:13:2648#include "aacenc_is.h"
Rostislav Pehlivanova1c487e2015-08-21 18:27:3849#include "aacenc_tns.h"
Rostislav Pehlivanovd1ca7142015-08-21 18:13:2650
Claudio Freire8df9bf82015-09-15 06:59:4551#include "libavcodec/aaccoder_twoloop.h"
52
/* Parameter a of f(lambda) = a*(lambda/100). The PNS code in this file floors
 * lambda/100 at 0.5 and caps the product at 0.75 to obtain a spread threshold;
 * bands whose spread is below that threshold are not coded with PNS
 * (since such SFBs contain tone rather than noise). */
#define NOISE_SPREAD_THRESHOLD 0.9f
Rostislav Pehlivanov38fd4c22015-07-02 18:13:0556
/* Parameter a of f(lambda) = a*(100/lambda), defines how much PNS is allowed
 * to replace low energy non zero bands: search_for_pns() keeps the regular
 * coding of a non-zero band whose energy exceeds threshold*f(lambda)*freq_boost. */
#define NOISE_LAMBDA_REPLACE 1.948f
Rostislav Pehlivanovc5d4f872015-04-15 11:18:4260
Claudio Freire8df9bf82015-09-15 06:59:4561#include "libavcodec/aaccoder_trellis.h"
62
Andreas Rheinhardt57d30522022-08-01 09:54:2563typedef float (*quantize_and_encode_band_func)(struct AACEncContext *s, PutBitContext *pb,
64 const float *in, float *quant, const float *scaled,
65 int size, int scale_idx, int cb,
66 const float lambda, const float uplim,
67 int *bits, float *energy);
68
69/**
70 * Calculate rate distortion cost for quantizing with given codebook
71 *
72 * @return quantization distortion
73 */
74static av_always_inline float quantize_and_encode_band_cost_template(
75 struct AACEncContext *s,
76 PutBitContext *pb, const float *in, float *out,
77 const float *scaled, int size, int scale_idx,
78 int cb, const float lambda, const float uplim,
79 int *bits, float *energy, int BT_ZERO, int BT_UNSIGNED,
80 int BT_PAIR, int BT_ESC, int BT_NOISE, int BT_STEREO,
81 const float ROUNDING)
82{
83 const int q_idx = POW_SF2_ZERO - scale_idx + SCALE_ONE_POS - SCALE_DIV_512;
84 const float Q = ff_aac_pow2sf_tab [q_idx];
85 const float Q34 = ff_aac_pow34sf_tab[q_idx];
86 const float IQ = ff_aac_pow2sf_tab [POW_SF2_ZERO + scale_idx - SCALE_ONE_POS + SCALE_DIV_512];
87 const float CLIPPED_ESCAPE = 165140.0f*IQ;
88 float cost = 0;
89 float qenergy = 0;
90 const int dim = BT_PAIR ? 2 : 4;
91 int resbits = 0;
92 int off;
93
94 if (BT_ZERO || BT_NOISE || BT_STEREO) {
95 for (int i = 0; i < size; i++)
96 cost += in[i]*in[i];
97 if (bits)
98 *bits = 0;
99 if (energy)
100 *energy = qenergy;
101 if (out) {
102 for (int i = 0; i < size; i += dim)
103 for (int j = 0; j < dim; j++)
104 out[i+j] = 0.0f;
105 }
106 return cost * lambda;
107 }
108 if (!scaled) {
Andreas Rheinhardt88b3b092024-02-28 12:29:19109 s->aacdsp.abs_pow34(s->scoefs, in, size);
Andreas Rheinhardt57d30522022-08-01 09:54:25110 scaled = s->scoefs;
111 }
Andreas Rheinhardt88b3b092024-02-28 12:29:19112 s->aacdsp.quant_bands(s->qcoefs, in, scaled, size, !BT_UNSIGNED, aac_cb_maxval[cb], Q34, ROUNDING);
Andreas Rheinhardt57d30522022-08-01 09:54:25113 if (BT_UNSIGNED) {
114 off = 0;
115 } else {
116 off = aac_cb_maxval[cb];
117 }
118 for (int i = 0; i < size; i += dim) {
119 const float *vec;
120 int *quants = s->qcoefs + i;
121 int curidx = 0;
122 int curbits;
123 float quantized, rd = 0.0f;
124 for (int j = 0; j < dim; j++) {
125 curidx *= aac_cb_range[cb];
126 curidx += quants[j] + off;
127 }
128 curbits = ff_aac_spectral_bits[cb-1][curidx];
129 vec = &ff_aac_codebook_vectors[cb-1][curidx*dim];
130 if (BT_UNSIGNED) {
131 for (int j = 0; j < dim; j++) {
132 float t = fabsf(in[i+j]);
133 float di;
134 if (BT_ESC && vec[j] == 64.0f) { //FIXME: slow
135 if (t >= CLIPPED_ESCAPE) {
136 quantized = CLIPPED_ESCAPE;
137 curbits += 21;
138 } else {
139 int c = av_clip_uintp2(quant(t, Q, ROUNDING), 13);
140 quantized = c*cbrtf(c)*IQ;
141 curbits += av_log2(c)*2 - 4 + 1;
142 }
143 } else {
144 quantized = vec[j]*IQ;
145 }
146 di = t - quantized;
147 if (out)
148 out[i+j] = in[i+j] >= 0 ? quantized : -quantized;
149 if (vec[j] != 0.0f)
150 curbits++;
151 qenergy += quantized*quantized;
152 rd += di*di;
153 }
154 } else {
155 for (int j = 0; j < dim; j++) {
156 quantized = vec[j]*IQ;
157 qenergy += quantized*quantized;
158 if (out)
159 out[i+j] = quantized;
160 rd += (in[i+j] - quantized)*(in[i+j] - quantized);
161 }
162 }
163 cost += rd * lambda + curbits;
164 resbits += curbits;
165 if (cost >= uplim)
166 return uplim;
167 if (pb) {
168 put_bits(pb, ff_aac_spectral_bits[cb-1][curidx], ff_aac_spectral_codes[cb-1][curidx]);
169 if (BT_UNSIGNED)
170 for (int j = 0; j < dim; j++)
171 if (ff_aac_codebook_vectors[cb-1][curidx*dim+j] != 0.0f)
172 put_bits(pb, 1, in[i+j] < 0.0f);
173 if (BT_ESC) {
174 for (int j = 0; j < 2; j++) {
175 if (ff_aac_codebook_vectors[cb-1][curidx*2+j] == 64.0f) {
176 int coef = av_clip_uintp2(quant(fabsf(in[i+j]), Q, ROUNDING), 13);
177 int len = av_log2(coef);
178
179 put_bits(pb, len - 4 + 1, (1 << (len - 4 + 1)) - 2);
180 put_sbits(pb, len, coef);
181 }
182 }
183 }
184 }
185 }
186
187 if (bits)
188 *bits = resbits;
189 if (energy)
190 *energy = qenergy;
191 return cost;
192}
193
194static inline float quantize_and_encode_band_cost_NONE(struct AACEncContext *s, PutBitContext *pb,
195 const float *in, float *quant, const float *scaled,
196 int size, int scale_idx, int cb,
197 const float lambda, const float uplim,
198 int *bits, float *energy) {
199 av_assert0(0);
200 return 0.0f;
201}
202
/*
 * Define quantize_and_encode_band_cost_<NAME>(), a wrapper that calls
 * quantize_and_encode_band_cost_template() with the given constant band-type
 * flags and rounding value. When BT_ESC is set the codebook passed on is
 * forced to ESC_BT regardless of the cb argument.
 */
#define QUANTIZE_AND_ENCODE_BAND_COST_FUNC(NAME, BT_ZERO, BT_UNSIGNED, BT_PAIR, BT_ESC, BT_NOISE, BT_STEREO, ROUNDING) \
static float quantize_and_encode_band_cost_ ## NAME(                                         \
                                struct AACEncContext *s,                                     \
                                PutBitContext *pb, const float *in, float *quant,            \
                                const float *scaled, int size, int scale_idx,                \
                                int cb, const float lambda, const float uplim,               \
                                int *bits, float *energy) {                                  \
    return quantize_and_encode_band_cost_template(                                           \
                                s, pb, in, quant, scaled, size, scale_idx,                   \
                                BT_ESC ? ESC_BT : cb, lambda, uplim, bits, energy,           \
                                BT_ZERO, BT_UNSIGNED, BT_PAIR, BT_ESC, BT_NOISE, BT_STEREO,  \
                                ROUNDING);                                                   \
}
216
217QUANTIZE_AND_ENCODE_BAND_COST_FUNC(ZERO, 1, 0, 0, 0, 0, 0, ROUND_STANDARD)
218QUANTIZE_AND_ENCODE_BAND_COST_FUNC(SQUAD, 0, 0, 0, 0, 0, 0, ROUND_STANDARD)
219QUANTIZE_AND_ENCODE_BAND_COST_FUNC(UQUAD, 0, 1, 0, 0, 0, 0, ROUND_STANDARD)
220QUANTIZE_AND_ENCODE_BAND_COST_FUNC(SPAIR, 0, 0, 1, 0, 0, 0, ROUND_STANDARD)
221QUANTIZE_AND_ENCODE_BAND_COST_FUNC(UPAIR, 0, 1, 1, 0, 0, 0, ROUND_STANDARD)
222QUANTIZE_AND_ENCODE_BAND_COST_FUNC(ESC, 0, 1, 1, 1, 0, 0, ROUND_STANDARD)
223QUANTIZE_AND_ENCODE_BAND_COST_FUNC(ESC_RTZ, 0, 1, 1, 1, 0, 0, ROUND_TO_ZERO)
224QUANTIZE_AND_ENCODE_BAND_COST_FUNC(NOISE, 0, 0, 0, 0, 1, 0, ROUND_STANDARD)
225QUANTIZE_AND_ENCODE_BAND_COST_FUNC(STEREO,0, 0, 0, 0, 0, 1, ROUND_STANDARD)
226
Andreas Rheinhardtb71e2e42022-10-22 12:02:50227static const quantize_and_encode_band_func quantize_and_encode_band_cost_arr[] =
Andreas Rheinhardt57d30522022-08-01 09:54:25228{
229 quantize_and_encode_band_cost_ZERO,
230 quantize_and_encode_band_cost_SQUAD,
231 quantize_and_encode_band_cost_SQUAD,
232 quantize_and_encode_band_cost_UQUAD,
233 quantize_and_encode_band_cost_UQUAD,
234 quantize_and_encode_band_cost_SPAIR,
235 quantize_and_encode_band_cost_SPAIR,
236 quantize_and_encode_band_cost_UPAIR,
237 quantize_and_encode_band_cost_UPAIR,
238 quantize_and_encode_band_cost_UPAIR,
239 quantize_and_encode_band_cost_UPAIR,
240 quantize_and_encode_band_cost_ESC,
241 quantize_and_encode_band_cost_NONE, /* CB 12 doesn't exist */
242 quantize_and_encode_band_cost_NOISE,
243 quantize_and_encode_band_cost_STEREO,
244 quantize_and_encode_band_cost_STEREO,
245};
246
Andreas Rheinhardtb71e2e42022-10-22 12:02:50247static const quantize_and_encode_band_func quantize_and_encode_band_cost_rtz_arr[] =
Andreas Rheinhardt57d30522022-08-01 09:54:25248{
249 quantize_and_encode_band_cost_ZERO,
250 quantize_and_encode_band_cost_SQUAD,
251 quantize_and_encode_band_cost_SQUAD,
252 quantize_and_encode_band_cost_UQUAD,
253 quantize_and_encode_band_cost_UQUAD,
254 quantize_and_encode_band_cost_SPAIR,
255 quantize_and_encode_band_cost_SPAIR,
256 quantize_and_encode_band_cost_UPAIR,
257 quantize_and_encode_band_cost_UPAIR,
258 quantize_and_encode_band_cost_UPAIR,
259 quantize_and_encode_band_cost_UPAIR,
260 quantize_and_encode_band_cost_ESC_RTZ,
261 quantize_and_encode_band_cost_NONE, /* CB 12 doesn't exist */
262 quantize_and_encode_band_cost_NOISE,
263 quantize_and_encode_band_cost_STEREO,
264 quantize_and_encode_band_cost_STEREO,
265};
266
267float ff_quantize_and_encode_band_cost(struct AACEncContext *s, PutBitContext *pb,
268 const float *in, float *quant, const float *scaled,
269 int size, int scale_idx, int cb,
270 const float lambda, const float uplim,
271 int *bits, float *energy)
272{
273 return quantize_and_encode_band_cost_arr[cb](s, pb, in, quant, scaled, size,
274 scale_idx, cb, lambda, uplim,
275 bits, energy);
276}
277
278static inline void quantize_and_encode_band(struct AACEncContext *s, PutBitContext *pb,
279 const float *in, float *out, int size, int scale_idx,
280 int cb, const float lambda, int rtz)
281{
282 (rtz ? quantize_and_encode_band_cost_rtz_arr : quantize_and_encode_band_cost_arr)[cb](s, pb, in, out, NULL, size, scale_idx, cb,
283 lambda, INFINITY, NULL, NULL);
284}
285
/**
 * structure used in optimal codebook search
 */
typedef struct BandCodingPath {
    int prev_idx; ///< pointer to the previous path point
    float cost;   ///< path cost
    int run;      ///< NOTE(review): presumably the run length of the current section - confirm
} BandCodingPath;
294
/**
 * One node of a trellis search: accumulated cost and back-pointer.
 */
typedef struct TrellisPath {
    float cost; ///< accumulated cost of the path ending in this node
    int prev;   ///< index of the previous node on that path
} TrellisPath;
299
/* Dimensions of the scalefactor trellis: number of stages, and one state per
 * scalefactor difference in the range 0..SCALE_MAX_DIFF */
#define TRELLIS_STAGES 121
#define TRELLIS_STATES (SCALE_MAX_DIFF+1)
Alex Conversef5e82fe2009-09-21 04:32:51302
Rostislav Pehlivanov7c10b872015-06-26 20:16:34303static void set_special_band_scalefactors(AACEncContext *s, SingleChannelElement *sce)
304{
Claudio Freire60a76f82016-01-16 23:44:36305 int w, g;
306 int prevscaler_n = -255, prevscaler_i = 0;
Rostislav Pehlivanov7c10b872015-06-26 20:16:34307 int bands = 0;
308
309 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Rostislav Pehlivanov6612d042016-08-13 16:34:58310 for (g = 0; g < sce->ics.num_swb; g++) {
Claudio Freire60a76f82016-01-16 23:44:36311 if (sce->zeroes[w*16+g])
312 continue;
Rostislav Pehlivanov7c10b872015-06-26 20:16:34313 if (sce->band_type[w*16+g] == INTENSITY_BT || sce->band_type[w*16+g] == INTENSITY_BT2) {
Rostislav Pehlivanovb9b1fd12015-09-06 14:07:29314 sce->sf_idx[w*16+g] = av_clip(roundf(log2f(sce->is_ener[w*16+g])*2), -155, 100);
Rostislav Pehlivanov7c10b872015-06-26 20:16:34315 bands++;
316 } else if (sce->band_type[w*16+g] == NOISE_BT) {
Rostislav Pehlivanovda64bd62015-09-09 09:44:33317 sce->sf_idx[w*16+g] = av_clip(3+ceilf(log2f(sce->pns_ener[w*16+g])*2), -100, 155);
Claudio Freire60a76f82016-01-16 23:44:36318 if (prevscaler_n == -255)
319 prevscaler_n = sce->sf_idx[w*16+g];
Rostislav Pehlivanov7c10b872015-06-26 20:16:34320 bands++;
321 }
Rostislav Pehlivanov7c10b872015-06-26 20:16:34322 }
323 }
324
325 if (!bands)
326 return;
327
328 /* Clip the scalefactor indices */
329 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Rostislav Pehlivanov6612d042016-08-13 16:34:58330 for (g = 0; g < sce->ics.num_swb; g++) {
Claudio Freire60a76f82016-01-16 23:44:36331 if (sce->zeroes[w*16+g])
332 continue;
Rostislav Pehlivanov7c10b872015-06-26 20:16:34333 if (sce->band_type[w*16+g] == INTENSITY_BT || sce->band_type[w*16+g] == INTENSITY_BT2) {
Claudio Freire60a76f82016-01-16 23:44:36334 sce->sf_idx[w*16+g] = prevscaler_i = av_clip(sce->sf_idx[w*16+g], prevscaler_i - SCALE_MAX_DIFF, prevscaler_i + SCALE_MAX_DIFF);
Rostislav Pehlivanov7c10b872015-06-26 20:16:34335 } else if (sce->band_type[w*16+g] == NOISE_BT) {
Claudio Freire60a76f82016-01-16 23:44:36336 sce->sf_idx[w*16+g] = prevscaler_n = av_clip(sce->sf_idx[w*16+g], prevscaler_n - SCALE_MAX_DIFF, prevscaler_n + SCALE_MAX_DIFF);
Rostislav Pehlivanov7c10b872015-06-26 20:16:34337 }
338 }
339 }
340}
341
Alex Converse78e65cd2009-07-08 20:01:31342static void search_for_quantizers_fast(AVCodecContext *avctx, AACEncContext *s,
Diego Biurrun99d61d32009-07-08 21:16:06343 SingleChannelElement *sce,
344 const float lambda)
Alex Converse78e65cd2009-07-08 20:01:31345{
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31346 int start = 0, i, w, w2, g;
Anton Khirnov494760f2013-05-07 05:20:32347 int destbits = avctx->bit_rate * 1024.0 / avctx->sample_rate / avctx->ch_layout.nb_channels * (lambda / 120.f);
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31348 float dists[128] = { 0 }, uplims[128] = { 0 };
349 float maxvals[128];
350 int fflag, minscaler;
351 int its = 0;
352 int allz = 0;
353 float minthr = INFINITY;
Alex Converse78e65cd2009-07-08 20:01:31354
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31355 // for values above this the decoder might end up in an endless loop
356 // due to always having more bits than what can be encoded.
357 destbits = FFMIN(destbits, 5800);
Rostislav Pehlivanov6612d042016-08-13 16:34:58358 //some heuristic to determine initial quantizers will reduce search time
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31359 //determine zero bands and upper limits
Alex Conversefd257dc2009-07-08 20:36:45360 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31361 start = 0;
Rostislav Pehlivanov6612d042016-08-13 16:34:58362 for (g = 0; g < sce->ics.num_swb; g++) {
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31363 int nz = 0;
Andreas Rheinhardt01d158d2021-12-01 14:22:05364 float uplim = 0.0f;
Alex Conversefd257dc2009-07-08 20:36:45365 for (w2 = 0; w2 < sce->ics.group_len[w]; w2++) {
Nathan Caldwell0bc01cc2011-06-15 08:50:25366 FFPsyBand *band = &s->psy.ch[s->cur_channel].psy_bands[(w+w2)*16+g];
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31367 uplim += band->threshold;
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31368 if (band->energy <= band->threshold || band->threshold == 0.0f) {
Alex Converse78e65cd2009-07-08 20:01:31369 sce->zeroes[(w+w2)*16+g] = 1;
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31370 continue;
Alex Converse78e65cd2009-07-08 20:01:31371 }
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31372 nz = 1;
Alex Converse78e65cd2009-07-08 20:01:31373 }
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31374 uplims[w*16+g] = uplim *512;
375 sce->band_type[w*16+g] = 0;
376 sce->zeroes[w*16+g] = !nz;
377 if (nz)
378 minthr = FFMIN(minthr, uplim);
379 allz |= nz;
380 start += sce->ics.swb_sizes[g];
Alex Converse78e65cd2009-07-08 20:01:31381 }
382 }
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31383 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Rostislav Pehlivanov6612d042016-08-13 16:34:58384 for (g = 0; g < sce->ics.num_swb; g++) {
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31385 if (sce->zeroes[w*16+g]) {
386 sce->sf_idx[w*16+g] = SCALE_ONE_POS;
387 continue;
388 }
389 sce->sf_idx[w*16+g] = SCALE_ONE_POS + FFMIN(log2f(uplims[w*16+g]/minthr)*4,59);
390 }
Alex Converse78e65cd2009-07-08 20:01:31391 }
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31392
393 if (!allz)
394 return;
Andreas Rheinhardt88b3b092024-02-28 12:29:19395 s->aacdsp.abs_pow34(s->scoefs, sce->coeffs, 1024);
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31396 ff_quantize_band_cost_cache_init(s);
397
398 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
399 start = w*128;
Rostislav Pehlivanov6612d042016-08-13 16:34:58400 for (g = 0; g < sce->ics.num_swb; g++) {
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31401 const float *scaled = s->scoefs + start;
402 maxvals[w*16+g] = find_max_val(sce->ics.group_len[w], sce->ics.swb_sizes[g], scaled);
403 start += sce->ics.swb_sizes[g];
404 }
405 }
406
407 //perform two-loop search
408 //outer loop - improve quality
409 do {
410 int tbits, qstep;
411 minscaler = sce->sf_idx[0];
412 //inner loop - quantize spectrum to fit into given number of bits
413 qstep = its ? 1 : 32;
414 do {
415 int prev = -1;
416 tbits = 0;
417 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
418 start = w*128;
Rostislav Pehlivanov6612d042016-08-13 16:34:58419 for (g = 0; g < sce->ics.num_swb; g++) {
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31420 const float *coefs = sce->coeffs + start;
421 const float *scaled = s->scoefs + start;
422 int bits = 0;
423 int cb;
424 float dist = 0.0f;
425
426 if (sce->zeroes[w*16+g] || sce->sf_idx[w*16+g] >= 218) {
427 start += sce->ics.swb_sizes[g];
428 continue;
429 }
430 minscaler = FFMIN(minscaler, sce->sf_idx[w*16+g]);
431 cb = find_min_book(maxvals[w*16+g], sce->sf_idx[w*16+g]);
432 for (w2 = 0; w2 < sce->ics.group_len[w]; w2++) {
433 int b;
434 dist += quantize_band_cost_cached(s, w + w2, g,
435 coefs + w2*128,
436 scaled + w2*128,
437 sce->ics.swb_sizes[g],
438 sce->sf_idx[w*16+g],
439 cb, 1.0f, INFINITY,
440 &b, NULL, 0);
441 bits += b;
442 }
443 dists[w*16+g] = dist - bits;
444 if (prev != -1) {
445 bits += ff_aac_scalefactor_bits[sce->sf_idx[w*16+g] - prev + SCALE_DIFF_ZERO];
446 }
447 tbits += bits;
448 start += sce->ics.swb_sizes[g];
449 prev = sce->sf_idx[w*16+g];
450 }
451 }
452 if (tbits > destbits) {
453 for (i = 0; i < 128; i++)
454 if (sce->sf_idx[i] < 218 - qstep)
455 sce->sf_idx[i] += qstep;
456 } else {
457 for (i = 0; i < 128; i++)
458 if (sce->sf_idx[i] > 60 - qstep)
459 sce->sf_idx[i] -= qstep;
460 }
461 qstep >>= 1;
462 if (!qstep && tbits > destbits*1.02 && sce->sf_idx[0] < 217)
463 qstep = 1;
464 } while (qstep);
465
466 fflag = 0;
467 minscaler = av_clip(minscaler, 60, 255 - SCALE_MAX_DIFF);
468
469 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
470 for (g = 0; g < sce->ics.num_swb; g++) {
471 int prevsc = sce->sf_idx[w*16+g];
472 if (dists[w*16+g] > uplims[w*16+g] && sce->sf_idx[w*16+g] > 60) {
473 if (find_min_book(maxvals[w*16+g], sce->sf_idx[w*16+g]-1))
474 sce->sf_idx[w*16+g]--;
475 else //Try to make sure there is some energy in every band
476 sce->sf_idx[w*16+g]-=2;
477 }
478 sce->sf_idx[w*16+g] = av_clip(sce->sf_idx[w*16+g], minscaler, minscaler + SCALE_MAX_DIFF);
479 sce->sf_idx[w*16+g] = FFMIN(sce->sf_idx[w*16+g], 219);
480 if (sce->sf_idx[w*16+g] != prevsc)
481 fflag = 1;
482 sce->band_type[w*16+g] = find_min_book(maxvals[w*16+g], sce->sf_idx[w*16+g]);
483 }
484 }
485 its++;
486 } while (fflag && its < 10);
Alex Converse78e65cd2009-07-08 20:01:31487}
488
Rostislav Pehlivanov6d175152015-07-29 04:44:24489static void search_for_pns(AACEncContext *s, AVCodecContext *avctx, SingleChannelElement *sce)
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05490{
Rostislav Pehlivanov033e5892015-09-06 14:13:18491 FFPsyBand *band;
Rostislav Pehlivanovda64bd62015-09-09 09:44:33492 int w, g, w2, i;
Claudio Freire01ecb712015-10-11 20:29:50493 int wlen = 1024 / sce->ics.num_windows;
494 int bandwidth, cutoff;
Rostislav Pehlivanov033e5892015-09-06 14:13:18495 float *PNS = &s->scoefs[0*128], *PNS34 = &s->scoefs[1*128];
496 float *NOR34 = &s->scoefs[3*128];
Claudio Freireca203e92015-12-01 06:28:36497 uint8_t nextband[128];
Rostislav Pehlivanov6d175152015-07-29 04:44:24498 const float lambda = s->lambda;
Claudio Freire01ecb712015-10-11 20:29:50499 const float freq_mult = avctx->sample_rate*0.5f/wlen;
Rostislav Pehlivanov033e5892015-09-06 14:13:18500 const float thr_mult = NOISE_LAMBDA_REPLACE*(100.0f/lambda);
Claudio Freire01ecb712015-10-11 20:29:50501 const float spread_threshold = FFMIN(0.75f, NOISE_SPREAD_THRESHOLD*FFMAX(0.5f, lambda/100.f));
502 const float dist_bias = av_clipf(4.f * 120 / lambda, 0.25f, 4.0f);
503 const float pns_transient_energy_r = FFMIN(0.7f, lambda / 140.f);
504
505 int refbits = avctx->bit_rate * 1024.0 / avctx->sample_rate
Anton Khirnov494760f2013-05-07 05:20:32506 / ((avctx->flags & AV_CODEC_FLAG_QSCALE) ? 2.0f : avctx->ch_layout.nb_channels)
Claudio Freire01ecb712015-10-11 20:29:50507 * (lambda / 120.f);
508
509 /** Keep this in sync with twoloop's cutoff selection */
510 float rate_bandwidth_multiplier = 1.5f;
Claudio Freireca203e92015-12-01 06:28:36511 int prev = -1000, prev_sf = -1;
James Almerf5c8d002017-03-26 00:35:15512 int frame_bit_rate = (avctx->flags & AV_CODEC_FLAG_QSCALE)
Claudio Freire01ecb712015-10-11 20:29:50513 ? (refbits * rate_bandwidth_multiplier * avctx->sample_rate / 1024)
Anton Khirnov494760f2013-05-07 05:20:32514 : (avctx->bit_rate / avctx->ch_layout.nb_channels);
Claudio Freire01ecb712015-10-11 20:29:50515
516 frame_bit_rate *= 1.15f;
517
518 if (avctx->cutoff > 0) {
519 bandwidth = avctx->cutoff;
520 } else {
521 bandwidth = FFMAX(3000, AAC_CUTOFF_FROM_BITRATE(frame_bit_rate, 1, avctx->sample_rate));
522 }
523
524 cutoff = bandwidth * 2 * wlen / avctx->sample_rate;
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05525
Claudio Freire9458a622015-09-25 06:56:32526 memcpy(sce->band_alt, sce->band_type, sizeof(sce->band_type));
Claudio Freireca203e92015-12-01 06:28:36527 ff_init_nextband_map(sce, nextband);
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05528 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Claudio Freire0f98fd32015-09-26 07:49:16529 int wstart = w*128;
Rostislav Pehlivanov6612d042016-08-13 16:34:58530 for (g = 0; g < sce->ics.num_swb; g++) {
Rostislav Pehlivanovda64bd62015-09-09 09:44:33531 int noise_sfi;
Rostislav Pehlivanov033e5892015-09-06 14:13:18532 float dist1 = 0.0f, dist2 = 0.0f, noise_amp;
Claudio Freire9458a622015-09-25 06:56:32533 float pns_energy = 0.0f, pns_tgt_energy, energy_ratio, dist_thresh;
Claudio Freire01ecb712015-10-11 20:29:50534 float sfb_energy = 0.0f, threshold = 0.0f, spread = 2.0f;
535 float min_energy = -1.0f, max_energy = 0.0f;
Claudio Freire0f98fd32015-09-26 07:49:16536 const int start = wstart+sce->ics.swb_offset[g];
Claudio Freire9458a622015-09-25 06:56:32537 const float freq = (start-wstart)*freq_mult;
Rostislav Pehlivanovda64bd62015-09-09 09:44:33538 const float freq_boost = FFMAX(0.88f*freq/NOISE_LOW_LIMIT, 1.0f);
Claudio Freire00d481b2016-01-08 07:39:02539 if (freq < NOISE_LOW_LIMIT || (start-wstart) >= cutoff) {
540 if (!sce->zeroes[w*16+g])
541 prev_sf = sce->sf_idx[w*16+g];
Rostislav Pehlivanov033e5892015-09-06 14:13:18542 continue;
Claudio Freire00d481b2016-01-08 07:39:02543 }
Rostislav Pehlivanov033e5892015-09-06 14:13:18544 for (w2 = 0; w2 < sce->ics.group_len[w]; w2++) {
545 band = &s->psy.ch[s->cur_channel].psy_bands[(w+w2)*16+g];
Rostislav Pehlivanovb6cc8ec2015-09-07 11:39:04546 sfb_energy += band->energy;
Claudio Freire01ecb712015-10-11 20:29:50547 spread = FFMIN(spread, band->spread);
Rostislav Pehlivanovb6cc8ec2015-09-07 11:39:04548 threshold += band->threshold;
Claudio Freire01ecb712015-10-11 20:29:50549 if (!w2) {
550 min_energy = max_energy = band->energy;
551 } else {
552 min_energy = FFMIN(min_energy, band->energy);
553 max_energy = FFMAX(max_energy, band->energy);
554 }
Rostislav Pehlivanov033e5892015-09-06 14:13:18555 }
Rostislav Pehlivanov033e5892015-09-06 14:13:18556
Rostislav Pehlivanovda64bd62015-09-09 09:44:33557 /* Ramps down at ~8000Hz and loosens the dist threshold */
Claudio Freire01ecb712015-10-11 20:29:50558 dist_thresh = av_clipf(2.5f*NOISE_LOW_LIMIT/freq, 0.5f, 2.5f) * dist_bias;
Rostislav Pehlivanov033e5892015-09-06 14:13:18559
Claudio Freire01ecb712015-10-11 20:29:50560 /* PNS is acceptable when all of these are true:
561 * 1. high spread energy (noise-like band)
562 * 2. near-threshold energy (high PE means the random nature of PNS content will be noticed)
563 * 3. on short window groups, all windows have similar energy (variations in energy would be destroyed by PNS)
564 *
565 * At this stage, point 2 is relaxed for zeroed bands near the noise threshold (hole avoidance is more important)
Claudio Freire9458a622015-09-25 06:56:32566 */
Claudio Freireca203e92015-12-01 06:28:36567 if ((!sce->zeroes[w*16+g] && !ff_sfdelta_can_remove_band(sce, nextband, prev_sf, w*16+g)) ||
568 ((sce->zeroes[w*16+g] || !sce->band_alt[w*16+g]) && sfb_energy < threshold*sqrtf(1.0f/freq_boost)) || spread < spread_threshold ||
Claudio Freire01ecb712015-10-11 20:29:50569 (!sce->zeroes[w*16+g] && sce->band_alt[w*16+g] && sfb_energy > threshold*thr_mult*freq_boost) ||
570 min_energy < pns_transient_energy_r * max_energy ) {
Rostislav Pehlivanovda64bd62015-09-09 09:44:33571 sce->pns_ener[w*16+g] = sfb_energy;
Claudio Freireca203e92015-12-01 06:28:36572 if (!sce->zeroes[w*16+g])
573 prev_sf = sce->sf_idx[w*16+g];
Rostislav Pehlivanov033e5892015-09-06 14:13:18574 continue;
575 }
576
Claudio Freire01ecb712015-10-11 20:29:50577 pns_tgt_energy = sfb_energy*FFMIN(1.0f, spread*spread);
Claudio Freire9458a622015-09-25 06:56:32578 noise_sfi = av_clip(roundf(log2f(pns_tgt_energy)*2), -100, 155); /* Quantize */
Rostislav Pehlivanovb6cc8ec2015-09-07 11:39:04579 noise_amp = -ff_aac_pow2sf_tab[noise_sfi + POW_SF2_ZERO]; /* Dequantize */
Claudio Freireca203e92015-12-01 06:28:36580 if (prev != -1000) {
581 int noise_sfdiff = noise_sfi - prev + SCALE_DIFF_ZERO;
582 if (noise_sfdiff < 0 || noise_sfdiff > 2*SCALE_MAX_DIFF) {
583 if (!sce->zeroes[w*16+g])
584 prev_sf = sce->sf_idx[w*16+g];
585 continue;
586 }
587 }
Rostislav Pehlivanov033e5892015-09-06 14:13:18588 for (w2 = 0; w2 < sce->ics.group_len[w]; w2++) {
Claudio Freire9458a622015-09-25 06:56:32589 float band_energy, scale, pns_senergy;
Claudio Freire0f98fd32015-09-26 07:49:16590 const int start_c = (w+w2)*128+sce->ics.swb_offset[g];
Rostislav Pehlivanovda64bd62015-09-09 09:44:33591 band = &s->psy.ch[s->cur_channel].psy_bands[(w+w2)*16+g];
Rostislav Pehlivanov230178d2016-10-08 00:47:04592 for (i = 0; i < sce->ics.swb_sizes[g]; i++) {
593 s->random_state = lcg_random(s->random_state);
594 PNS[i] = s->random_state;
Rostislav Pehlivanovade31b92015-12-14 18:53:09595 }
Rostislav Pehlivanov033e5892015-09-06 14:13:18596 band_energy = s->fdsp->scalarproduct_float(PNS, PNS, sce->ics.swb_sizes[g]);
597 scale = noise_amp/sqrtf(band_energy);
598 s->fdsp->vector_fmul_scalar(PNS, PNS, scale, sce->ics.swb_sizes[g]);
Claudio Freire9458a622015-09-25 06:56:32599 pns_senergy = s->fdsp->scalarproduct_float(PNS, PNS, sce->ics.swb_sizes[g]);
600 pns_energy += pns_senergy;
Andreas Rheinhardt88b3b092024-02-28 12:29:19601 s->aacdsp.abs_pow34(NOR34, &sce->coeffs[start_c], sce->ics.swb_sizes[g]);
602 s->aacdsp.abs_pow34(PNS34, PNS, sce->ics.swb_sizes[g]);
Rostislav Pehlivanovda64bd62015-09-09 09:44:33603 dist1 += quantize_band_cost(s, &sce->coeffs[start_c],
Rostislav Pehlivanov033e5892015-09-06 14:13:18604 NOR34,
605 sce->ics.swb_sizes[g],
606 sce->sf_idx[(w+w2)*16+g],
607 sce->band_alt[(w+w2)*16+g],
Andreas Rheinhardt386990a2022-08-01 07:45:10608 lambda/band->threshold, INFINITY, NULL, NULL);
Claudio Freire01ecb712015-10-11 20:29:50609 /* Estimate rd on average as 5 bits for SF, 4 for the CB, plus spread energy * lambda/thr */
610 dist2 += band->energy/(band->spread*band->spread)*lambda*dist_thresh/band->threshold;
611 }
Claudio Freire124c3752015-12-09 20:36:32612 if (g && sce->band_type[w*16+g-1] == NOISE_BT) {
Claudio Freire01ecb712015-10-11 20:29:50613 dist2 += 5;
614 } else {
615 dist2 += 9;
Rostislav Pehlivanov033e5892015-09-06 14:13:18616 }
Claudio Freire9458a622015-09-25 06:56:32617 energy_ratio = pns_tgt_energy/pns_energy; /* Compensates for quantization error */
618 sce->pns_ener[w*16+g] = energy_ratio*pns_tgt_energy;
Claudio Freire01ecb712015-10-11 20:29:50619 if (sce->zeroes[w*16+g] || !sce->band_alt[w*16+g] || (energy_ratio > 0.85f && energy_ratio < 1.25f && dist2 < dist1)) {
Rostislav Pehlivanov033e5892015-09-06 14:13:18620 sce->band_type[w*16+g] = NOISE_BT;
621 sce->zeroes[w*16+g] = 0;
Claudio Freireca203e92015-12-01 06:28:36622 prev = noise_sfi;
Claudio Freire4720a562015-12-22 08:26:12623 } else {
624 if (!sce->zeroes[w*16+g])
625 prev_sf = sce->sf_idx[w*16+g];
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05626 }
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05627 }
628 }
629}
630
Claudio Freire01ecb712015-10-11 20:29:50631static void mark_pns(AACEncContext *s, AVCodecContext *avctx, SingleChannelElement *sce)
632{
633 FFPsyBand *band;
634 int w, g, w2;
635 int wlen = 1024 / sce->ics.num_windows;
636 int bandwidth, cutoff;
637 const float lambda = s->lambda;
638 const float freq_mult = avctx->sample_rate*0.5f/wlen;
639 const float spread_threshold = FFMIN(0.75f, NOISE_SPREAD_THRESHOLD*FFMAX(0.5f, lambda/100.f));
640 const float pns_transient_energy_r = FFMIN(0.7f, lambda / 140.f);
641
642 int refbits = avctx->bit_rate * 1024.0 / avctx->sample_rate
Anton Khirnov494760f2013-05-07 05:20:32643 / ((avctx->flags & AV_CODEC_FLAG_QSCALE) ? 2.0f : avctx->ch_layout.nb_channels)
Claudio Freire01ecb712015-10-11 20:29:50644 * (lambda / 120.f);
645
646 /** Keep this in sync with twoloop's cutoff selection */
647 float rate_bandwidth_multiplier = 1.5f;
James Almerf5c8d002017-03-26 00:35:15648 int frame_bit_rate = (avctx->flags & AV_CODEC_FLAG_QSCALE)
Claudio Freire01ecb712015-10-11 20:29:50649 ? (refbits * rate_bandwidth_multiplier * avctx->sample_rate / 1024)
Anton Khirnov494760f2013-05-07 05:20:32650 : (avctx->bit_rate / avctx->ch_layout.nb_channels);
Claudio Freire01ecb712015-10-11 20:29:50651
652 frame_bit_rate *= 1.15f;
653
654 if (avctx->cutoff > 0) {
655 bandwidth = avctx->cutoff;
656 } else {
657 bandwidth = FFMAX(3000, AAC_CUTOFF_FROM_BITRATE(frame_bit_rate, 1, avctx->sample_rate));
658 }
659
660 cutoff = bandwidth * 2 * wlen / avctx->sample_rate;
661
662 memcpy(sce->band_alt, sce->band_type, sizeof(sce->band_type));
663 for (w = 0; w < sce->ics.num_windows; w += sce->ics.group_len[w]) {
Rostislav Pehlivanov6612d042016-08-13 16:34:58664 for (g = 0; g < sce->ics.num_swb; g++) {
Claudio Freire01ecb712015-10-11 20:29:50665 float sfb_energy = 0.0f, threshold = 0.0f, spread = 2.0f;
666 float min_energy = -1.0f, max_energy = 0.0f;
667 const int start = sce->ics.swb_offset[g];
668 const float freq = start*freq_mult;
669 const float freq_boost = FFMAX(0.88f*freq/NOISE_LOW_LIMIT, 1.0f);
670 if (freq < NOISE_LOW_LIMIT || start >= cutoff) {
671 sce->can_pns[w*16+g] = 0;
672 continue;
673 }
674 for (w2 = 0; w2 < sce->ics.group_len[w]; w2++) {
675 band = &s->psy.ch[s->cur_channel].psy_bands[(w+w2)*16+g];
676 sfb_energy += band->energy;
677 spread = FFMIN(spread, band->spread);
678 threshold += band->threshold;
679 if (!w2) {
680 min_energy = max_energy = band->energy;
681 } else {
682 min_energy = FFMIN(min_energy, band->energy);
683 max_energy = FFMAX(max_energy, band->energy);
684 }
685 }
686
687 /* PNS is acceptable when all of these are true:
688 * 1. high spread energy (noise-like band)
689 * 2. near-threshold energy (high PE means the random nature of PNS content will be noticed)
690 * 3. on short window groups, all windows have similar energy (variations in energy would be destroyed by PNS)
691 */
692 sce->pns_ener[w*16+g] = sfb_energy;
693 if (sfb_energy < threshold*sqrtf(1.5f/freq_boost) || spread < spread_threshold || min_energy < pns_transient_energy_r * max_energy) {
694 sce->can_pns[w*16+g] = 0;
695 } else {
696 sce->can_pns[w*16+g] = 1;
697 }
698 }
699 }
700}
701
Rostislav Pehlivanov6d175152015-07-29 04:44:24702static void search_for_ms(AACEncContext *s, ChannelElement *cpe)
Alex Converse78e65cd2009-07-08 20:01:31703{
Claudio Freireca203e92015-12-01 06:28:36704 int start = 0, i, w, w2, g, sid_sf_boost, prev_mid, prev_side;
705 uint8_t nextband0[128], nextband1[128];
Rostislav Pehlivanovd2ae5f72016-10-08 14:59:14706 float *M = s->scoefs + 128*0, *S = s->scoefs + 128*1;
707 float *L34 = s->scoefs + 128*2, *R34 = s->scoefs + 128*3;
708 float *M34 = s->scoefs + 128*4, *S34 = s->scoefs + 128*5;
Rostislav Pehlivanov6d175152015-07-29 04:44:24709 const float lambda = s->lambda;
Claudio Freire01ecb712015-10-11 20:29:50710 const float mslambda = FFMIN(1.0f, lambda / 120.f);
Alex Converse78e65cd2009-07-08 20:01:31711 SingleChannelElement *sce0 = &cpe->ch[0];
712 SingleChannelElement *sce1 = &cpe->ch[1];
Alex Conversefd257dc2009-07-08 20:36:45713 if (!cpe->common_window)
Alex Converse78e65cd2009-07-08 20:01:31714 return;
Claudio Freire01ecb712015-10-11 20:29:50715
Claudio Freireca203e92015-12-01 06:28:36716 /** Scout out next nonzero bands */
717 ff_init_nextband_map(sce0, nextband0);
718 ff_init_nextband_map(sce1, nextband1);
719
720 prev_mid = sce0->sf_idx[0];
721 prev_side = sce1->sf_idx[0];
722 for (w = 0; w < sce0->ics.num_windows; w += sce0->ics.group_len[w]) {
Rostislav Pehlivanov57848ef2015-07-02 18:13:02723 start = 0;
Rostislav Pehlivanov6612d042016-08-13 16:34:58724 for (g = 0; g < sce0->ics.num_swb; g++) {
Claudio Freire01ecb712015-10-11 20:29:50725 float bmax = bval2bmax(g * 17.0f / sce0->ics.num_swb) / 0.0045f;
Claudio Freire6711aa22016-01-08 08:31:32726 if (!cpe->is_mask[w*16+g])
727 cpe->ms_mask[w*16+g] = 0;
728 if (!sce0->zeroes[w*16+g] && !sce1->zeroes[w*16+g] && !cpe->is_mask[w*16+g]) {
Claudio Freire01ecb712015-10-11 20:29:50729 float Mmax = 0.0f, Smax = 0.0f;
730
731 /* Must compute mid/side SF and book for the whole window group */
Alex Conversefd257dc2009-07-08 20:36:45732 for (w2 = 0; w2 < sce0->ics.group_len[w]; w2++) {
Alex Conversefd257dc2009-07-08 20:36:45733 for (i = 0; i < sce0->ics.swb_sizes[g]; i++) {
Rostislav Pehlivanov32be2642015-08-21 17:30:51734 M[i] = (sce0->coeffs[start+(w+w2)*128+i]
735 + sce1->coeffs[start+(w+w2)*128+i]) * 0.5;
Young Han Lee92efa2b2011-03-24 01:49:36736 S[i] = M[i]
Rostislav Pehlivanov32be2642015-08-21 17:30:51737 - sce1->coeffs[start+(w+w2)*128+i];
Alex Converse78e65cd2009-07-08 20:01:31738 }
Andreas Rheinhardt88b3b092024-02-28 12:29:19739 s->aacdsp.abs_pow34(M34, M, sce0->ics.swb_sizes[g]);
740 s->aacdsp.abs_pow34(S34, S, sce0->ics.swb_sizes[g]);
Claudio Freire01ecb712015-10-11 20:29:50741 for (i = 0; i < sce0->ics.swb_sizes[g]; i++ ) {
742 Mmax = FFMAX(Mmax, M34[i]);
743 Smax = FFMAX(Smax, S34[i]);
744 }
Alex Converse78e65cd2009-07-08 20:01:31745 }
Claudio Freire01ecb712015-10-11 20:29:50746
747 for (sid_sf_boost = 0; sid_sf_boost < 4; sid_sf_boost++) {
748 float dist1 = 0.0f, dist2 = 0.0f;
749 int B0 = 0, B1 = 0;
750 int minidx;
751 int mididx, sididx;
752 int midcb, sidcb;
753
754 minidx = FFMIN(sce0->sf_idx[w*16+g], sce1->sf_idx[w*16+g]);
Claudio Freireca203e92015-12-01 06:28:36755 mididx = av_clip(minidx, 0, SCALE_MAX_POS - SCALE_DIV_512);
756 sididx = av_clip(minidx - sid_sf_boost * 3, 0, SCALE_MAX_POS - SCALE_DIV_512);
Claudio Freire6711aa22016-01-08 08:31:32757 if (sce0->band_type[w*16+g] != NOISE_BT && sce1->band_type[w*16+g] != NOISE_BT
Claudio Freireca203e92015-12-01 06:28:36758 && ( !ff_sfdelta_can_replace(sce0, nextband0, prev_mid, mididx, w*16+g)
759 || !ff_sfdelta_can_replace(sce1, nextband1, prev_side, sididx, w*16+g))) {
Claudio Freire01ecb712015-10-11 20:29:50760 /* scalefactor range violation, bad stuff, will decrease quality unacceptably */
761 continue;
762 }
763
Claudio Freireca203e92015-12-01 06:28:36764 midcb = find_min_book(Mmax, mididx);
765 sidcb = find_min_book(Smax, sididx);
766
Claudio Freire01ecb712015-10-11 20:29:50767 /* No CB can be zero */
768 midcb = FFMAX(1,midcb);
769 sidcb = FFMAX(1,sidcb);
770
771 for (w2 = 0; w2 < sce0->ics.group_len[w]; w2++) {
772 FFPsyBand *band0 = &s->psy.ch[s->cur_channel+0].psy_bands[(w+w2)*16+g];
773 FFPsyBand *band1 = &s->psy.ch[s->cur_channel+1].psy_bands[(w+w2)*16+g];
774 float minthr = FFMIN(band0->threshold, band1->threshold);
775 int b1,b2,b3,b4;
776 for (i = 0; i < sce0->ics.swb_sizes[g]; i++) {
777 M[i] = (sce0->coeffs[start+(w+w2)*128+i]
778 + sce1->coeffs[start+(w+w2)*128+i]) * 0.5;
779 S[i] = M[i]
780 - sce1->coeffs[start+(w+w2)*128+i];
781 }
782
Andreas Rheinhardt88b3b092024-02-28 12:29:19783 s->aacdsp.abs_pow34(L34, sce0->coeffs+start+(w+w2)*128, sce0->ics.swb_sizes[g]);
784 s->aacdsp.abs_pow34(R34, sce1->coeffs+start+(w+w2)*128, sce0->ics.swb_sizes[g]);
785 s->aacdsp.abs_pow34(M34, M, sce0->ics.swb_sizes[g]);
786 s->aacdsp.abs_pow34(S34, S, sce0->ics.swb_sizes[g]);
Claudio Freire01ecb712015-10-11 20:29:50787 dist1 += quantize_band_cost(s, &sce0->coeffs[start + (w+w2)*128],
788 L34,
789 sce0->ics.swb_sizes[g],
Claudio Freire6711aa22016-01-08 08:31:32790 sce0->sf_idx[w*16+g],
791 sce0->band_type[w*16+g],
Andreas Rheinhardt386990a2022-08-01 07:45:10792 lambda / (band0->threshold + FLT_MIN), INFINITY, &b1, NULL);
Claudio Freire01ecb712015-10-11 20:29:50793 dist1 += quantize_band_cost(s, &sce1->coeffs[start + (w+w2)*128],
794 R34,
795 sce1->ics.swb_sizes[g],
Claudio Freire6711aa22016-01-08 08:31:32796 sce1->sf_idx[w*16+g],
797 sce1->band_type[w*16+g],
Andreas Rheinhardt386990a2022-08-01 07:45:10798 lambda / (band1->threshold + FLT_MIN), INFINITY, &b2, NULL);
Claudio Freire01ecb712015-10-11 20:29:50799 dist2 += quantize_band_cost(s, M,
800 M34,
801 sce0->ics.swb_sizes[g],
Claudio Freire6711aa22016-01-08 08:31:32802 mididx,
803 midcb,
Andreas Rheinhardt386990a2022-08-01 07:45:10804 lambda / (minthr + FLT_MIN), INFINITY, &b3, NULL);
Claudio Freire01ecb712015-10-11 20:29:50805 dist2 += quantize_band_cost(s, S,
806 S34,
807 sce1->ics.swb_sizes[g],
Claudio Freire6711aa22016-01-08 08:31:32808 sididx,
809 sidcb,
Andreas Rheinhardt386990a2022-08-01 07:45:10810 mslambda / (minthr * bmax + FLT_MIN), INFINITY, &b4, NULL);
Claudio Freire01ecb712015-10-11 20:29:50811 B0 += b1+b2;
812 B1 += b3+b4;
Claudio Freire6711aa22016-01-08 08:31:32813 dist1 -= b1+b2;
814 dist2 -= b3+b4;
Claudio Freire01ecb712015-10-11 20:29:50815 }
816 cpe->ms_mask[w*16+g] = dist2 <= dist1 && B1 < B0;
817 if (cpe->ms_mask[w*16+g]) {
Claudio Freire6711aa22016-01-08 08:31:32818 if (sce0->band_type[w*16+g] != NOISE_BT && sce1->band_type[w*16+g] != NOISE_BT) {
Claudio Freire01ecb712015-10-11 20:29:50819 sce0->sf_idx[w*16+g] = mididx;
820 sce1->sf_idx[w*16+g] = sididx;
821 sce0->band_type[w*16+g] = midcb;
822 sce1->band_type[w*16+g] = sidcb;
Claudio Freire6711aa22016-01-08 08:31:32823 } else if ((sce0->band_type[w*16+g] != NOISE_BT) ^ (sce1->band_type[w*16+g] != NOISE_BT)) {
824 /* ms_mask unneeded, and it confuses some decoders */
825 cpe->ms_mask[w*16+g] = 0;
Claudio Freire01ecb712015-10-11 20:29:50826 }
827 break;
828 } else if (B1 > B0) {
829 /* More boost won't fix this */
830 break;
831 }
832 }
Alex Converse78e65cd2009-07-08 20:01:31833 }
Claudio Freireca203e92015-12-01 06:28:36834 if (!sce0->zeroes[w*16+g] && sce0->band_type[w*16+g] < RESERVED_BT)
835 prev_mid = sce0->sf_idx[w*16+g];
836 if (!sce1->zeroes[w*16+g] && !cpe->is_mask[w*16+g] && sce1->band_type[w*16+g] < RESERVED_BT)
837 prev_side = sce1->sf_idx[w*16+g];
Alex Converse78e65cd2009-07-08 20:01:31838 start += sce0->ics.swb_sizes[g];
839 }
840 }
841}
842
James Almer318778d2017-09-26 18:58:40843const AACCoefficientsEncoder ff_aac_coders[AAC_CODER_NB] = {
Timothy Gu4bd910d2013-09-11 03:23:32844 [AAC_CODER_TWOLOOP] = {
Alex Converse78e65cd2009-07-08 20:01:31845 search_for_quantizers_twoloop,
Alex Converse759510e2010-05-14 16:49:51846 codebook_trellis_rate,
Alex Converse78e65cd2009-07-08 20:01:31847 quantize_and_encode_band,
Timothy Gu21dd5272015-08-22 05:11:23848 ff_aac_encode_tns_info,
Rostislav Pehlivanovf20b6712015-08-29 05:47:31849 ff_aac_apply_tns,
Rostislav Pehlivanove06578e2015-07-02 18:13:04850 set_special_band_scalefactors,
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05851 search_for_pns,
Claudio Freire01ecb712015-10-11 20:29:50852 mark_pns,
Timothy Gu21dd5272015-08-22 05:11:23853 ff_aac_search_for_tns,
Alex Conversedd0e43e2009-08-27 17:46:13854 search_for_ms,
Timothy Gu21dd5272015-08-22 05:11:23855 ff_aac_search_for_is,
Alex Converse78e65cd2009-07-08 20:01:31856 },
Timothy Gu4bd910d2013-09-11 03:23:32857 [AAC_CODER_FAST] = {
Alex Converse78e65cd2009-07-08 20:01:31858 search_for_quantizers_fast,
Rostislav Pehlivanovc92cc2d2016-08-06 23:47:31859 codebook_trellis_rate,
Alex Converse78e65cd2009-07-08 20:01:31860 quantize_and_encode_band,
Timothy Gu21dd5272015-08-22 05:11:23861 ff_aac_encode_tns_info,
Rostislav Pehlivanovf20b6712015-08-29 05:47:31862 ff_aac_apply_tns,
Rostislav Pehlivanove06578e2015-07-02 18:13:04863 set_special_band_scalefactors,
Rostislav Pehlivanov38fd4c22015-07-02 18:13:05864 search_for_pns,
Claudio Freire01ecb712015-10-11 20:29:50865 mark_pns,
Timothy Gu21dd5272015-08-22 05:11:23866 ff_aac_search_for_tns,
Alex Conversedd0e43e2009-08-27 17:46:13867 search_for_ms,
Timothy Gu21dd5272015-08-22 05:11:23868 ff_aac_search_for_is,
Alex Converse78e65cd2009-07-08 20:01:31869 },
870};