/*
 * AAC encoder utilities
 * Copyright (C) 2015 Rostislav Pehlivanov
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */
/**
 * @file
 * AAC encoder utilities
 * @author Rostislav Pehlivanov ( atomnuker gmail com )
 */
28 #ifndef AVCODEC_AACENC_UTILS_H
29 #define AVCODEC_AACENC_UTILS_H
31 #include "libavutil/ffmath.h"
33 #include "aacenctab.h"
/**
 * Rounding offsets added to a scaled value before it is truncated to an
 * integer. C_QUANT is the offset find_min_book() applies to the band
 * maximum; ROUND_STANDARD and ROUND_TO_ZERO are presumably intended as
 * values for quant()'s rounding argument (callers are outside this header).
 */
#define ROUND_STANDARD 0.4054f
#define ROUND_TO_ZERO  0.1054f
#define C_QUANT        0.4054f
40 static inline float pos_pow34(float a
)
42 return sqrtf(a
* sqrtf(a
));
46 * Quantize one coefficient.
47 * @return absolute value of the quantized coefficient
48 * @see 3GPP TS26.403 5.6.2 "Scalefactor determination"
50 static inline int quant(float coef
, const float Q
, const float rounding
)
53 return sqrtf(a
* sqrtf(a
)) + rounding
;
/**
 * Find the largest value in one band across a window group.
 *
 * Values are compared as stored (no fabsf() is applied here), and the
 * running maximum starts at 0.0f, so the result is never negative.
 *
 * @param group_len number of windows to scan
 * @param swb_size  number of values read per window
 * @param scaled    input values; window w2 starts at scaled[w2 * 128]
 * @return the maximum found, or 0.0f when nothing exceeds it
 */
static inline float find_max_val(int group_len, int swb_size, const float *scaled)
{
    float maxval = 0.0f;
    int w2, i;

    for (w2 = 0; w2 < group_len; w2++) {
        const float *win = scaled + w2 * 128;

        for (i = 0; i < swb_size; i++)
            maxval = FFMAX(maxval, win[i]);
    }

    return maxval;
}
68 static inline int find_min_book(float maxval
, int sf
)
70 float Q34
= ff_aac_pow34sf_tab
[POW_SF2_ZERO
- sf
+ SCALE_ONE_POS
- SCALE_DIV_512
];
72 qmaxval
= maxval
* Q34
+ C_QUANT
;
73 if (qmaxval
>= (FF_ARRAY_ELEMS(aac_maxval_cb
)))
76 cb
= aac_maxval_cb
[qmaxval
];
/**
 * Compute an energy-weighted form factor for one band across a window group.
 *
 * For every window the mean magnitude, mean energy, standard deviation,
 * peak and a "soft" count of non-zero lines are gathered. Windows whose
 * summed energy exceeds thresh contribute
 * e2 * sqrt(e / min(e + 4 * stddev, peak)) / max(0.5, nzl), weighted by e2.
 *
 * NOTE(review): several statements of this function (the accumulations,
 * the nzl branches and the final fallback) are restored from the upstream
 * header - confirm against it.
 *
 * @param group_len number of windows to scan
 * @param swb_size  number of lines per window; expected to be > 1, since
 *                  1 / (swb_size - 1) is infinite for swb_size == 1
 * @param thresh    energy threshold, used both per line and per window
 * @param scaled    input lines; window w2 starts at scaled[w2 * 128]
 * @param nzslope   exponent of the below-threshold roll-off of the line count
 * @return weighted mean of the per-window form factors, or 1.0f when no
 *         window carries weight
 */
static inline float find_form_factor(int group_len, int swb_size, float thresh,
                                     const float *scaled, float nzslope)
{
    const float iswb_size   = 1.0f / swb_size;
    const float iswb_sizem1 = 1.0f / (swb_size - 1);
    const float ethresh     = thresh;
    float form = 0.0f, weight = 0.0f;
    int w2, i;

    for (w2 = 0; w2 < group_len; w2++) {
        const float *win = scaled + w2 * 128;
        float e = 0.0f, e2 = 0.0f, var = 0.0f, maxval = 0.0f;
        float nzl = 0;

        for (i = 0; i < swb_size; i++) {
            float s = fabsf(win[i]);

            maxval = FFMAX(maxval, s);
            e  += s;
            s  *= s;   /* from here on s is the line energy */
            e2 += s;

            /* We really don't want a hard non-zero-line count, since
             * even below-threshold lines do add up towards band spectral power.
             * So, fall steeply towards zero, but smoothly
             */
            if (s >= ethresh) {
                nzl += 1.0f;
            } else if (nzslope == 2.f) {
                /* same as the power below, without calling ff_fast_powf() */
                nzl += (s / ethresh) * (s / ethresh);
            } else {
                nzl += ff_fast_powf(s / ethresh, nzslope);
            }
        }

        if (e2 > thresh) {
            float frm;

            e *= iswb_size;

            /** compute variance */
            for (i = 0; i < swb_size; i++) {
                float d = fabsf(win[i]) - e;
                var += d * d;
            }
            var = sqrtf(var * iswb_sizem1);

            e2 *= iswb_size;
            frm = e / FFMIN(e + 4 * var, maxval);
            form   += e2 * sqrtf(frm) / FFMAX(0.5f, nzl);
            weight += e2;
        }
    }

    if (weight > 0)
        return form / weight;

    return 1.0f;
}
132 /** Return the minimum scalefactor where the quantized coef does not clip. */
133 static inline uint8_t coef2minsf(float coef
)
135 return av_clip_uint8(log2f(coef
)*4 - 69 + SCALE_ONE_POS
- SCALE_DIV_512
);
138 /** Return the maximum scalefactor where the quantized coef is not zero. */
139 static inline uint8_t coef2maxsf(float coef
)
141 return av_clip_uint8(log2f(coef
)*4 + 6 + SCALE_ONE_POS
- SCALE_DIV_512
);
/**
 * Returns the closest possible index to an array of float values, given a value.
 *
 * Closeness is measured by squared difference. On a tie the lowest index
 * wins, because only a strictly smaller error replaces the current best.
 *
 * @param val value to look up
 * @param arr candidate values
 * @param num number of entries in arr
 * @return index of the entry nearest to val, or 0 when num <= 0
 */
static inline int quant_array_idx(const float val, const float *arr, const int num)
{
    int i, index = 0;
    float quant_min_err = INFINITY;

    for (i = 0; i < num; i++) {
        const float diff  = val - arr[i];
        const float error = diff * diff;

        if (error < quant_min_err) {
            quant_min_err = error;
            index         = i;
        }
    }

    return index;
}
162 * approximates exp10f(-3.0f*(0.5f + 0.5f * cosf(FFMIN(b,15.5f) / 15.5f)))
164 static av_always_inline
float bval2bmax(float b
)
166 return 0.001f
+ 0.0035f
* (b
*b
*b
) / (15.5f
*15.5f
*15.5f
);
170 * Compute a nextband map to be used with SF delta constraint utilities.
171 * The nextband array should contain 128 elements, and positions that don't
172 * map to valid, nonzero bands of the form w*16+g (with w being the initial
173 * window of the window group, only) are left indetermined.
175 static inline void ff_init_nextband_map(const SingleChannelElement
*sce
, uint8_t *nextband
)
177 unsigned char prevband
= 0;
179 /** Just a safe default */
180 for (g
= 0; g
< 128; g
++)
183 /** Now really navigate the nonzero band chain */
184 for (w
= 0; w
< sce
->ics
.num_windows
; w
+= sce
->ics
.group_len
[w
]) {
185 for (g
= 0; g
< sce
->ics
.num_swb
; g
++) {
186 if (!sce
->zeroes
[w
*16+g
] && sce
->band_type
[w
*16+g
] < RESERVED_BT
)
187 prevband
= nextband
[prevband
] = w
*16+g
;
190 nextband
[prevband
] = prevband
; /* terminate */
/**
 * Updates nextband to reflect a removed band (equivalent to
 * calling ff_init_nextband_map after marking a band as zero)
 *
 * @param nextband map to update in place
 * @param prevband index of the band that currently links to band
 * @param band     index of the band being removed
 */
static inline void ff_nextband_remove(uint8_t *nextband, int prevband, int band)
{
    /* bypass the removed band: its predecessor now points at its successor */
    nextband[prevband] = nextband[band];
}
203 * Checks whether the specified band could be removed without inducing
204 * scalefactor delta that violates SF delta encoding constraints.
205 * prev_sf has to be the scalefactor of the previous nonzero, nonspecial
206 * band, in encoding order, or negative if there was no such band.
208 static inline int ff_sfdelta_can_remove_band(const SingleChannelElement
*sce
,
209 const uint8_t *nextband
, int prev_sf
, int band
)
212 && sce
->sf_idx
[nextband
[band
]] >= (prev_sf
- SCALE_MAX_DIFF
)
213 && sce
->sf_idx
[nextband
[band
]] <= (prev_sf
+ SCALE_MAX_DIFF
);
217 * Checks whether the specified band's scalefactor could be replaced
218 * with another one without violating SF delta encoding constraints.
219 * prev_sf has to be the scalefactor of the previous nonzero, nonsepcial
220 * band, in encoding order, or negative if there was no such band.
222 static inline int ff_sfdelta_can_replace(const SingleChannelElement
*sce
,
223 const uint8_t *nextband
, int prev_sf
, int new_sf
, int band
)
225 return new_sf
>= (prev_sf
- SCALE_MAX_DIFF
)
226 && new_sf
<= (prev_sf
+ SCALE_MAX_DIFF
)
227 && sce
->sf_idx
[nextband
[band
]] >= (new_sf
- SCALE_MAX_DIFF
)
228 && sce
->sf_idx
[nextband
[band
]] <= (new_sf
+ SCALE_MAX_DIFF
);
232 * linear congruential pseudorandom number generator
234 * @param previous_val pointer to the current state of the generator
236 * @return Returns a 32-bit pseudorandom integer
238 static av_always_inline
int lcg_random(unsigned previous_val
)
240 union { unsigned u
; int s
; } v
= { previous_val
* 1664525u + 1013904223 };
/**
 * Log an error and return AVERROR(EINVAL) from the enclosing function when
 * cond is true. A variable named avctx must be in scope at the point of
 * use; the remaining arguments are forwarded to av_log().
 * Expands to a bare if statement, so it must not be followed by an else.
 */
#define ERROR_IF(cond, ...) \
    if (cond) { \
        av_log(avctx, AV_LOG_ERROR, __VA_ARGS__); \
        return AVERROR(EINVAL); \
    }
/**
 * Log a warning when cond is true; execution then continues normally.
 * A variable named avctx must be in scope at the point of use; the
 * remaining arguments are forwarded to av_log().
 * Expands to a bare if statement, so it must not be followed by an else.
 */
#define WARN_IF(cond, ...) \
    if (cond) { \
        av_log(avctx, AV_LOG_WARNING, __VA_ARGS__); \
    }
255 #endif /* AVCODEC_AACENC_UTILS_H */