2051 lines
64 KiB
C
2051 lines
64 KiB
C
/*
|
|
* MP3 quantization
|
|
*
|
|
* Copyright (c) 1999-2000 Mark Taylor
|
|
* Copyright (c) 1999-2003 Takehiro Tominaga
|
|
* Copyright (c) 2000-2011 Robert Hegemann
|
|
* Copyright (c) 2001-2005 Gabriel Bouvigne
|
|
*
|
|
* This library is free software; you can redistribute it and/or
|
|
* modify it under the terms of the GNU Library General Public
|
|
* License as published by the Free Software Foundation; either
|
|
* version 2 of the License, or (at your option) any later version.
|
|
*
|
|
* This library is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
* Library General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU Library General Public
|
|
* License along with this library; if not, write to the
|
|
* Free Software Foundation, Inc., 59 Temple Place - Suite 330,
|
|
* Boston, MA 02111-1307, USA.
|
|
*/
|
|
|
|
/* $Id: quantize.c,v 1.219 2017/08/02 19:48:05 robert Exp $ */
|
|
|
|
#ifdef HAVE_CONFIG_H
|
|
# include <config.h>
|
|
#endif
|
|
|
|
#include "lame.h"
|
|
#include "machine.h"
|
|
#include "encoder.h"
|
|
#include "util.h"
|
|
#include "quantize_pvt.h"
|
|
#include "reservoir.h"
|
|
#include "bitstream.h"
|
|
#include "vbrquantize.h"
|
|
#include "quantize.h"
|
|
#ifdef HAVE_XMMINTRIN_H
|
|
#include "vector/lame_intrin.h"
|
|
#endif
|
|
|
|
|
|
|
|
|
|
/* convert from L/R <-> Mid/Side */
|
|
static void
|
|
ms_convert(III_side_info_t * l3_side, int gr)
|
|
{
|
|
int i;
|
|
for (i = 0; i < 576; ++i) {
|
|
FLOAT l, r;
|
|
l = l3_side->tt[gr][0].xr[i];
|
|
r = l3_side->tt[gr][1].xr[i];
|
|
l3_side->tt[gr][0].xr[i] = (l + r) * (FLOAT) (SQRT2 * 0.5);
|
|
l3_side->tt[gr][1].xr[i] = (l - r) * (FLOAT) (SQRT2 * 0.5);
|
|
}
|
|
}
|
|
|
|
/************************************************************************
|
|
*
|
|
* init_outer_loop()
|
|
* mt 6/99
|
|
*
|
|
* initializes cod_info, scalefac and xrpow
|
|
*
|
|
* (init_outer_loop() itself returns nothing; init_xrpow() below returns 0 if the summed |xr| is practically zero, else 1)
|
|
*
|
|
************************************************************************/
|
|
|
|
static void
|
|
init_xrpow_core_c(gr_info * const cod_info, FLOAT xrpow[576], int upper, FLOAT * sum)
|
|
{
|
|
int i;
|
|
FLOAT tmp;
|
|
*sum = 0;
|
|
for (i = 0; i <= upper; ++i) {
|
|
tmp = fabs(cod_info->xr[i]);
|
|
*sum += tmp;
|
|
xrpow[i] = sqrt(tmp * sqrt(tmp));
|
|
|
|
if (xrpow[i] > cod_info->xrpow_max)
|
|
cod_info->xrpow_max = xrpow[i];
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
void
|
|
init_xrpow_core_init(lame_internal_flags * const gfc)
|
|
{
|
|
gfc->init_xrpow_core = init_xrpow_core_c;
|
|
|
|
#if defined(HAVE_XMMINTRIN_H)
|
|
if (gfc->CPU_features.SSE)
|
|
gfc->init_xrpow_core = init_xrpow_core_sse;
|
|
#endif
|
|
#ifndef HAVE_NASM
|
|
#ifdef MIN_ARCH_SSE
|
|
gfc->init_xrpow_core = init_xrpow_core_sse;
|
|
#endif
|
|
#endif
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
init_xrpow(lame_internal_flags * gfc, gr_info * const cod_info, FLOAT xrpow[576])
|
|
{
|
|
FLOAT sum = 0;
|
|
int i;
|
|
int const upper = cod_info->max_nonzero_coeff;
|
|
|
|
assert(xrpow != NULL);
|
|
cod_info->xrpow_max = 0;
|
|
|
|
/* check if there is some energy we have to quantize
|
|
* and calculate xrpow matching our fresh scalefactors
|
|
*/
|
|
assert(0 <= upper && upper <= 575);
|
|
memset(&(xrpow[upper]), 0, (576 - upper) * sizeof(xrpow[0]));
|
|
|
|
|
|
gfc->init_xrpow_core(cod_info, xrpow, upper, &sum);
|
|
|
|
/* return 1 if we have something to quantize, else 0
|
|
*/
|
|
if (sum > (FLOAT) 1E-20) {
|
|
int j = 0;
|
|
if (gfc->sv_qnt.substep_shaping & 2)
|
|
j = 1;
|
|
|
|
for (i = 0; i < cod_info->psymax; i++)
|
|
gfc->sv_qnt.pseudohalf[i] = j;
|
|
|
|
return 1;
|
|
}
|
|
|
|
memset(&cod_info->l3_enc[0], 0, sizeof(int) * 576);
|
|
return 0;
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/*
|
|
Gabriel Bouvigne feb/apr 2003
|
|
Analog silence detection in partitionned sfb21
|
|
or sfb12 for short blocks
|
|
|
|
From top to bottom of sfb, changes to 0
|
|
coeffs which are below ath. It stops on the first
|
|
coeff higher than ath.
|
|
*/
|
|
static void
|
|
psfb21_analogsilence(lame_internal_flags const *gfc, gr_info * const cod_info)
|
|
{
|
|
ATH_t const *const ATH = gfc->ATH;
|
|
FLOAT *const xr = cod_info->xr;
|
|
|
|
if (cod_info->block_type != SHORT_TYPE) { /* NORM, START or STOP type, but not SHORT blocks */
|
|
int gsfb;
|
|
int stop = 0;
|
|
for (gsfb = PSFB21 - 1; gsfb >= 0 && !stop; gsfb--) {
|
|
int const start = gfc->scalefac_band.psfb21[gsfb];
|
|
int const end = gfc->scalefac_band.psfb21[gsfb + 1];
|
|
int j;
|
|
FLOAT ath21;
|
|
ath21 = athAdjust(ATH->adjust_factor, ATH->psfb21[gsfb], ATH->floor, 0);
|
|
|
|
if (gfc->sv_qnt.longfact[21] > 1e-12f)
|
|
ath21 *= gfc->sv_qnt.longfact[21];
|
|
|
|
for (j = end - 1; j >= start; j--) {
|
|
if (fabs(xr[j]) < ath21)
|
|
xr[j] = 0;
|
|
else {
|
|
stop = 1;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
else {
|
|
/*note: short blocks coeffs are reordered */
|
|
int block;
|
|
for (block = 0; block < 3; block++) {
|
|
|
|
int gsfb;
|
|
int stop = 0;
|
|
for (gsfb = PSFB12 - 1; gsfb >= 0 && !stop; gsfb--) {
|
|
int const start = gfc->scalefac_band.s[12] * 3 +
|
|
(gfc->scalefac_band.s[13] - gfc->scalefac_band.s[12]) * block +
|
|
(gfc->scalefac_band.psfb12[gsfb] - gfc->scalefac_band.psfb12[0]);
|
|
int const end =
|
|
start + (gfc->scalefac_band.psfb12[gsfb + 1] - gfc->scalefac_band.psfb12[gsfb]);
|
|
int j;
|
|
FLOAT ath12;
|
|
ath12 = athAdjust(ATH->adjust_factor, ATH->psfb12[gsfb], ATH->floor, 0);
|
|
|
|
if (gfc->sv_qnt.shortfact[12] > 1e-12f)
|
|
ath12 *= gfc->sv_qnt.shortfact[12];
|
|
|
|
for (j = end - 1; j >= start; j--) {
|
|
if (fabs(xr[j]) < ath12)
|
|
xr[j] = 0;
|
|
else {
|
|
stop = 1;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
static void
|
|
init_outer_loop(lame_internal_flags const *gfc, gr_info * const cod_info)
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
int sfb, j;
|
|
/* initialize fresh cod_info
|
|
*/
|
|
cod_info->part2_3_length = 0;
|
|
cod_info->big_values = 0;
|
|
cod_info->count1 = 0;
|
|
cod_info->global_gain = 210;
|
|
cod_info->scalefac_compress = 0;
|
|
/* mixed_block_flag, block_type was set in psymodel.c */
|
|
cod_info->table_select[0] = 0;
|
|
cod_info->table_select[1] = 0;
|
|
cod_info->table_select[2] = 0;
|
|
cod_info->subblock_gain[0] = 0;
|
|
cod_info->subblock_gain[1] = 0;
|
|
cod_info->subblock_gain[2] = 0;
|
|
cod_info->subblock_gain[3] = 0; /* this one is always 0 */
|
|
cod_info->region0_count = 0;
|
|
cod_info->region1_count = 0;
|
|
cod_info->preflag = 0;
|
|
cod_info->scalefac_scale = 0;
|
|
cod_info->count1table_select = 0;
|
|
cod_info->part2_length = 0;
|
|
if (cfg->samplerate_out <= 8000) {
|
|
cod_info->sfb_lmax = 17;
|
|
cod_info->sfb_smin = 9;
|
|
cod_info->psy_lmax = 17;
|
|
}
|
|
else {
|
|
cod_info->sfb_lmax = SBPSY_l;
|
|
cod_info->sfb_smin = SBPSY_s;
|
|
cod_info->psy_lmax = gfc->sv_qnt.sfb21_extra ? SBMAX_l : SBPSY_l;
|
|
}
|
|
cod_info->psymax = cod_info->psy_lmax;
|
|
cod_info->sfbmax = cod_info->sfb_lmax;
|
|
cod_info->sfbdivide = 11;
|
|
for (sfb = 0; sfb < SBMAX_l; sfb++) {
|
|
cod_info->width[sfb]
|
|
= gfc->scalefac_band.l[sfb + 1] - gfc->scalefac_band.l[sfb];
|
|
cod_info->window[sfb] = 3; /* which is always 0. */
|
|
}
|
|
if (cod_info->block_type == SHORT_TYPE) {
|
|
FLOAT ixwork[576];
|
|
FLOAT *ix;
|
|
|
|
cod_info->sfb_smin = 0;
|
|
cod_info->sfb_lmax = 0;
|
|
if (cod_info->mixed_block_flag) {
|
|
/*
|
|
* MPEG-1: sfbs 0-7 long block, 3-12 short blocks
|
|
* MPEG-2(.5): sfbs 0-5 long block, 3-12 short blocks
|
|
*/
|
|
cod_info->sfb_smin = 3;
|
|
cod_info->sfb_lmax = cfg->mode_gr * 2 + 4;
|
|
}
|
|
if (cfg->samplerate_out <= 8000) {
|
|
cod_info->psymax
|
|
= cod_info->sfb_lmax
|
|
+ 3 * (9 - cod_info->sfb_smin);
|
|
cod_info->sfbmax = cod_info->sfb_lmax + 3 * (9 - cod_info->sfb_smin);
|
|
}
|
|
else {
|
|
cod_info->psymax
|
|
= cod_info->sfb_lmax
|
|
+ 3 * ((gfc->sv_qnt.sfb21_extra ? SBMAX_s : SBPSY_s) - cod_info->sfb_smin);
|
|
cod_info->sfbmax = cod_info->sfb_lmax + 3 * (SBPSY_s - cod_info->sfb_smin);
|
|
}
|
|
cod_info->sfbdivide = cod_info->sfbmax - 18;
|
|
cod_info->psy_lmax = cod_info->sfb_lmax;
|
|
/* re-order the short blocks, for more efficient encoding below */
|
|
/* By Takehiro TOMINAGA */
|
|
/*
|
|
Within each scalefactor band, data is given for successive
|
|
time windows, beginning with window 0 and ending with window 2.
|
|
Within each window, the quantized values are then arranged in
|
|
order of increasing frequency...
|
|
*/
|
|
ix = &cod_info->xr[gfc->scalefac_band.l[cod_info->sfb_lmax]];
|
|
memcpy(ixwork, cod_info->xr, 576 * sizeof(FLOAT));
|
|
for (sfb = cod_info->sfb_smin; sfb < SBMAX_s; sfb++) {
|
|
int const start = gfc->scalefac_band.s[sfb];
|
|
int const end = gfc->scalefac_band.s[sfb + 1];
|
|
int window, l;
|
|
for (window = 0; window < 3; window++) {
|
|
for (l = start; l < end; l++) {
|
|
*ix++ = ixwork[3 * l + window];
|
|
}
|
|
}
|
|
}
|
|
|
|
j = cod_info->sfb_lmax;
|
|
for (sfb = cod_info->sfb_smin; sfb < SBMAX_s; sfb++) {
|
|
cod_info->width[j] = cod_info->width[j + 1] = cod_info->width[j + 2]
|
|
= gfc->scalefac_band.s[sfb + 1] - gfc->scalefac_band.s[sfb];
|
|
cod_info->window[j] = 0;
|
|
cod_info->window[j + 1] = 1;
|
|
cod_info->window[j + 2] = 2;
|
|
j += 3;
|
|
}
|
|
}
|
|
|
|
cod_info->count1bits = 0;
|
|
cod_info->sfb_partition_table = nr_of_sfb_block[0][0];
|
|
cod_info->slen[0] = 0;
|
|
cod_info->slen[1] = 0;
|
|
cod_info->slen[2] = 0;
|
|
cod_info->slen[3] = 0;
|
|
|
|
cod_info->max_nonzero_coeff = 575;
|
|
|
|
/* fresh scalefactors are all zero
|
|
*/
|
|
memset(cod_info->scalefac, 0, sizeof(cod_info->scalefac));
|
|
|
|
if (cfg->vbr != vbr_mt && cfg->vbr != vbr_mtrh && cfg->vbr != vbr_abr && cfg->vbr != vbr_off) {
|
|
psfb21_analogsilence(gfc, cod_info);
|
|
}
|
|
}
|
|
|
|
|
|
|
|
/************************************************************************
|
|
*
|
|
* bin_search_StepSize()
|
|
*
|
|
* author/date??
|
|
*
|
|
* binary step size search
|
|
* used by outer_loop to get a quantizer step size to start with
|
|
*
|
|
************************************************************************/
|
|
|
|
typedef enum {
|
|
BINSEARCH_NONE,
|
|
BINSEARCH_UP,
|
|
BINSEARCH_DOWN
|
|
} binsearchDirection_t;
|
|
|
|
static int
|
|
bin_search_StepSize(lame_internal_flags * const gfc, gr_info * const cod_info,
|
|
int desired_rate, const int ch, const FLOAT xrpow[576])
|
|
{
|
|
int nBits;
|
|
int CurrentStep = gfc->sv_qnt.CurrentStep[ch];
|
|
int flag_GoneOver = 0;
|
|
int const start = gfc->sv_qnt.OldValue[ch];
|
|
binsearchDirection_t Direction = BINSEARCH_NONE;
|
|
cod_info->global_gain = start;
|
|
desired_rate -= cod_info->part2_length;
|
|
|
|
assert(CurrentStep);
|
|
for (;;) {
|
|
int step;
|
|
nBits = count_bits(gfc, xrpow, cod_info, 0);
|
|
|
|
if (CurrentStep == 1 || nBits == desired_rate)
|
|
break; /* nothing to adjust anymore */
|
|
|
|
if (nBits > desired_rate) {
|
|
/* increase Quantize_StepSize */
|
|
if (Direction == BINSEARCH_DOWN)
|
|
flag_GoneOver = 1;
|
|
|
|
if (flag_GoneOver)
|
|
CurrentStep /= 2;
|
|
Direction = BINSEARCH_UP;
|
|
step = CurrentStep;
|
|
}
|
|
else {
|
|
/* decrease Quantize_StepSize */
|
|
if (Direction == BINSEARCH_UP)
|
|
flag_GoneOver = 1;
|
|
|
|
if (flag_GoneOver)
|
|
CurrentStep /= 2;
|
|
Direction = BINSEARCH_DOWN;
|
|
step = -CurrentStep;
|
|
}
|
|
cod_info->global_gain += step;
|
|
if (cod_info->global_gain < 0) {
|
|
cod_info->global_gain = 0;
|
|
flag_GoneOver = 1;
|
|
}
|
|
if (cod_info->global_gain > 255) {
|
|
cod_info->global_gain = 255;
|
|
flag_GoneOver = 1;
|
|
}
|
|
}
|
|
|
|
assert(cod_info->global_gain >= 0);
|
|
assert(cod_info->global_gain < 256);
|
|
|
|
while (nBits > desired_rate && cod_info->global_gain < 255) {
|
|
cod_info->global_gain++;
|
|
nBits = count_bits(gfc, xrpow, cod_info, 0);
|
|
}
|
|
gfc->sv_qnt.CurrentStep[ch] = (start - cod_info->global_gain >= 4) ? 4 : 2;
|
|
gfc->sv_qnt.OldValue[ch] = cod_info->global_gain;
|
|
cod_info->part2_3_length = nBits;
|
|
return nBits;
|
|
}
|
|
|
|
|
|
|
|
|
|
/************************************************************************
|
|
*
|
|
* trancate_smallspectrums()
|
|
*
|
|
* Takehiro TOMINAGA 2002-07-21
|
|
*
|
|
* truncate smaller numbers to 0 as long as the noise threshold allows it.
|
|
*
|
|
************************************************************************/
|
|
static int
|
|
floatcompare(const void *v1, const void *v2)
|
|
{
|
|
const FLOAT *const a = v1, *const b = v2;
|
|
if (*a > *b)
|
|
return 1;
|
|
if (*a < *b)
|
|
return -1;
|
|
return 0;
|
|
}
|
|
|
|
static void
|
|
trancate_smallspectrums(lame_internal_flags const *gfc,
|
|
gr_info * const gi, const FLOAT * const l3_xmin, FLOAT * const work)
|
|
{
|
|
int sfb, j, width;
|
|
FLOAT distort[SFBMAX];
|
|
calc_noise_result dummy;
|
|
|
|
if ((!(gfc->sv_qnt.substep_shaping & 4) && gi->block_type == SHORT_TYPE)
|
|
|| gfc->sv_qnt.substep_shaping & 0x80)
|
|
return;
|
|
(void) calc_noise(gi, l3_xmin, distort, &dummy, 0);
|
|
for (j = 0; j < 576; j++) {
|
|
FLOAT xr = 0.0;
|
|
if (gi->l3_enc[j] != 0)
|
|
xr = fabs(gi->xr[j]);
|
|
work[j] = xr;
|
|
}
|
|
|
|
j = 0;
|
|
sfb = 8;
|
|
if (gi->block_type == SHORT_TYPE)
|
|
sfb = 6;
|
|
do {
|
|
FLOAT allowedNoise, trancateThreshold;
|
|
int nsame, start;
|
|
|
|
width = gi->width[sfb];
|
|
j += width;
|
|
if (distort[sfb] >= 1.0)
|
|
continue;
|
|
|
|
qsort(&work[j - width], width, sizeof(FLOAT), floatcompare);
|
|
if (EQ(work[j - 1], 0.0))
|
|
continue; /* all zero sfb */
|
|
|
|
allowedNoise = (1.0 - distort[sfb]) * l3_xmin[sfb];
|
|
trancateThreshold = 0.0;
|
|
start = 0;
|
|
do {
|
|
FLOAT noise;
|
|
for (nsame = 1; start + nsame < width; nsame++)
|
|
if (NEQ(work[start + j - width], work[start + j + nsame - width]))
|
|
break;
|
|
|
|
noise = work[start + j - width] * work[start + j - width] * nsame;
|
|
if (allowedNoise < noise) {
|
|
if (start != 0)
|
|
trancateThreshold = work[start + j - width - 1];
|
|
break;
|
|
}
|
|
allowedNoise -= noise;
|
|
start += nsame;
|
|
} while (start < width);
|
|
if (EQ(trancateThreshold, 0.0))
|
|
continue;
|
|
|
|
/* printf("%e %e %e\n", */
|
|
/* trancateThreshold/l3_xmin[sfb], */
|
|
/* trancateThreshold/(l3_xmin[sfb]*start), */
|
|
/* trancateThreshold/(l3_xmin[sfb]*(start+width)) */
|
|
/* ); */
|
|
/* if (trancateThreshold > 1000*l3_xmin[sfb]*start) */
|
|
/* trancateThreshold = 1000*l3_xmin[sfb]*start; */
|
|
|
|
do {
|
|
if (fabs(gi->xr[j - width]) <= trancateThreshold)
|
|
gi->l3_enc[j - width] = 0;
|
|
} while (--width > 0);
|
|
} while (++sfb < gi->psymax);
|
|
|
|
gi->part2_3_length = noquant_count_bits(gfc, gi, 0);
|
|
}
|
|
|
|
|
|
/*************************************************************************
|
|
*
|
|
* loop_break()
|
|
*
|
|
* author/date??
|
|
*
|
|
* Function: Returns zero if there is a scalefac which has not been
|
|
* amplified. Otherwise it returns one.
|
|
*
|
|
*************************************************************************/
|
|
|
|
inline static int
|
|
loop_break(const gr_info * const cod_info)
|
|
{
|
|
int sfb;
|
|
|
|
for (sfb = 0; sfb < cod_info->sfbmax; sfb++)
|
|
if (cod_info->scalefac[sfb]
|
|
+ cod_info->subblock_gain[cod_info->window[sfb]] == 0)
|
|
return 0;
|
|
|
|
return 1;
|
|
}
|
|
|
|
|
|
|
|
|
|
/* mt 5/99: Function: Improved calc_noise for a single channel */
|
|
|
|
/*************************************************************************
|
|
*
|
|
* quant_compare()
|
|
*
|
|
* author/date??
|
|
*
|
|
* several different codes to decide which quantization is better
|
|
*
|
|
*************************************************************************/
|
|
|
|
/* Penalty term used by get_klemm_noise():
 * FAST_LOG10(0.368 + 0.632 * noise^3).
 */
static double
penalties(double noise)
{
    /* keep the left-to-right multiplication order of the original */
    double const weighted = 0.632 * noise * noise * noise;

    return FAST_LOG10(0.368 + weighted);
}
|
|
|
|
static double
|
|
get_klemm_noise(const FLOAT * distort, const gr_info * const gi)
|
|
{
|
|
int sfb;
|
|
double klemm_noise = 1E-37;
|
|
for (sfb = 0; sfb < gi->psymax; sfb++)
|
|
klemm_noise += penalties(distort[sfb]);
|
|
|
|
return Max(1e-20, klemm_noise);
|
|
}
|
|
|
|
inline static int
|
|
quant_compare(const int quant_comp,
|
|
const calc_noise_result * const best,
|
|
calc_noise_result * const calc, const gr_info * const gi, const FLOAT * distort)
|
|
{
|
|
/*
|
|
noise is given in decibels (dB) relative to masking thesholds.
|
|
|
|
over_noise: ??? (the previous comment is fully wrong)
|
|
tot_noise: ??? (the previous comment is fully wrong)
|
|
max_noise: max quantization noise
|
|
|
|
*/
|
|
int better;
|
|
|
|
switch (quant_comp) {
|
|
default:
|
|
case 9:{
|
|
if (best->over_count > 0) {
|
|
/* there are distorted sfb */
|
|
better = calc->over_SSD <= best->over_SSD;
|
|
if (calc->over_SSD == best->over_SSD)
|
|
better = calc->bits < best->bits;
|
|
}
|
|
else {
|
|
/* no distorted sfb */
|
|
better = ((calc->max_noise < 0) &&
|
|
((calc->max_noise * 10 + calc->bits) <=
|
|
(best->max_noise * 10 + best->bits)));
|
|
}
|
|
break;
|
|
}
|
|
|
|
case 0:
|
|
better = calc->over_count < best->over_count
|
|
|| (calc->over_count == best->over_count && calc->over_noise < best->over_noise)
|
|
|| (calc->over_count == best->over_count &&
|
|
EQ(calc->over_noise, best->over_noise) && calc->tot_noise < best->tot_noise);
|
|
break;
|
|
|
|
case 8:
|
|
calc->max_noise = get_klemm_noise(distort, gi);
|
|
/*lint --fallthrough */
|
|
case 1:
|
|
better = calc->max_noise < best->max_noise;
|
|
break;
|
|
case 2:
|
|
better = calc->tot_noise < best->tot_noise;
|
|
break;
|
|
case 3:
|
|
better = (calc->tot_noise < best->tot_noise)
|
|
&& (calc->max_noise < best->max_noise);
|
|
break;
|
|
case 4:
|
|
better = (calc->max_noise <= 0.0 && best->max_noise > 0.2)
|
|
|| (calc->max_noise <= 0.0 &&
|
|
best->max_noise < 0.0 &&
|
|
best->max_noise > calc->max_noise - 0.2 && calc->tot_noise < best->tot_noise)
|
|
|| (calc->max_noise <= 0.0 &&
|
|
best->max_noise > 0.0 &&
|
|
best->max_noise > calc->max_noise - 0.2 &&
|
|
calc->tot_noise < best->tot_noise + best->over_noise)
|
|
|| (calc->max_noise > 0.0 &&
|
|
best->max_noise > -0.05 &&
|
|
best->max_noise > calc->max_noise - 0.1 &&
|
|
calc->tot_noise + calc->over_noise < best->tot_noise + best->over_noise)
|
|
|| (calc->max_noise > 0.0 &&
|
|
best->max_noise > -0.1 &&
|
|
best->max_noise > calc->max_noise - 0.15 &&
|
|
calc->tot_noise + calc->over_noise + calc->over_noise <
|
|
best->tot_noise + best->over_noise + best->over_noise);
|
|
break;
|
|
case 5:
|
|
better = calc->over_noise < best->over_noise
|
|
|| (EQ(calc->over_noise, best->over_noise) && calc->tot_noise < best->tot_noise);
|
|
break;
|
|
case 6:
|
|
better = calc->over_noise < best->over_noise
|
|
|| (EQ(calc->over_noise, best->over_noise) &&
|
|
(calc->max_noise < best->max_noise
|
|
|| (EQ(calc->max_noise, best->max_noise) && calc->tot_noise <= best->tot_noise)
|
|
));
|
|
break;
|
|
case 7:
|
|
better = calc->over_count < best->over_count || calc->over_noise < best->over_noise;
|
|
break;
|
|
}
|
|
|
|
|
|
if (best->over_count == 0) {
|
|
/*
|
|
If no distorted bands, only use this quantization
|
|
if it is better, and if it uses less bits.
|
|
Unfortunately, part2_3_length is sometimes a poor
|
|
estimator of the final size at low bitrates.
|
|
*/
|
|
better = better && calc->bits < best->bits;
|
|
}
|
|
|
|
|
|
return better;
|
|
}
|
|
|
|
|
|
|
|
/*************************************************************************
|
|
*
|
|
* amp_scalefac_bands()
|
|
*
|
|
* author/date??
|
|
*
|
|
* Amplify the scalefactor bands that violate the masking threshold.
|
|
* See ISO 11172-3 Section C.1.5.4.3.5
|
|
*
|
|
* distort[] = noise/masking
|
|
* distort[] > 1 ==> noise is not masked
|
|
* distort[] < 1 ==> noise is masked
|
|
* max_dist = maximum value of distort[]
|
|
*
|
|
* Three algorithms:
|
|
* noise_shaping_amp
|
|
* 0 Amplify all bands with distort[]>1.
|
|
*
|
|
* 1 Amplify all bands with distort[] >= max_dist^(.5);
|
|
* ( 50% in the db scale)
|
|
*
|
|
* 2 Amplify first band with distort[] >= max_dist;
|
|
*
|
|
*
|
|
* For algorithms 0 and 1, if max_dist < 1, then amplify all bands
|
|
* with distort[] >= .95*max_dist. This is to make sure we always
|
|
* amplify at least one band.
|
|
*
|
|
*
|
|
*************************************************************************/
|
|
static void
|
|
amp_scalefac_bands(lame_internal_flags * gfc,
|
|
gr_info * const cod_info, FLOAT const *distort, FLOAT xrpow[576], int bRefine)
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
int j, sfb;
|
|
FLOAT ifqstep34, trigger;
|
|
int noise_shaping_amp;
|
|
|
|
if (cod_info->scalefac_scale == 0) {
|
|
ifqstep34 = 1.29683955465100964055; /* 2**(.75*.5) */
|
|
}
|
|
else {
|
|
ifqstep34 = 1.68179283050742922612; /* 2**(.75*1) */
|
|
}
|
|
|
|
/* compute maximum value of distort[] */
|
|
trigger = 0;
|
|
for (sfb = 0; sfb < cod_info->sfbmax; sfb++) {
|
|
if (trigger < distort[sfb])
|
|
trigger = distort[sfb];
|
|
}
|
|
|
|
noise_shaping_amp = cfg->noise_shaping_amp;
|
|
if (noise_shaping_amp == 3) {
|
|
if (bRefine == 1)
|
|
noise_shaping_amp = 2;
|
|
else
|
|
noise_shaping_amp = 1;
|
|
}
|
|
switch (noise_shaping_amp) {
|
|
case 2:
|
|
/* amplify exactly 1 band */
|
|
break;
|
|
|
|
case 1:
|
|
/* amplify bands within 50% of max (on db scale) */
|
|
if (trigger > 1.0)
|
|
trigger = pow(trigger, .5);
|
|
else
|
|
trigger *= .95;
|
|
break;
|
|
|
|
case 0:
|
|
default:
|
|
/* ISO algorithm. amplify all bands with distort>1 */
|
|
if (trigger > 1.0)
|
|
trigger = 1.0;
|
|
else
|
|
trigger *= .95;
|
|
break;
|
|
}
|
|
|
|
j = 0;
|
|
for (sfb = 0; sfb < cod_info->sfbmax; sfb++) {
|
|
int const width = cod_info->width[sfb];
|
|
int l;
|
|
j += width;
|
|
if (distort[sfb] < trigger)
|
|
continue;
|
|
|
|
if (gfc->sv_qnt.substep_shaping & 2) {
|
|
gfc->sv_qnt.pseudohalf[sfb] = !gfc->sv_qnt.pseudohalf[sfb];
|
|
if (!gfc->sv_qnt.pseudohalf[sfb] && cfg->noise_shaping_amp == 2)
|
|
return;
|
|
}
|
|
cod_info->scalefac[sfb]++;
|
|
for (l = -width; l < 0; l++) {
|
|
xrpow[j + l] *= ifqstep34;
|
|
if (xrpow[j + l] > cod_info->xrpow_max)
|
|
cod_info->xrpow_max = xrpow[j + l];
|
|
}
|
|
|
|
if (cfg->noise_shaping_amp == 2)
|
|
return;
|
|
}
|
|
}
|
|
|
|
/*************************************************************************
|
|
*
|
|
* inc_scalefac_scale()
|
|
*
|
|
* Takehiro Tominaga 2000-xx-xx
|
|
*
|
|
* turns on scalefac scale and adjusts scalefactors
|
|
*
|
|
*************************************************************************/
|
|
|
|
static void
|
|
inc_scalefac_scale(gr_info * const cod_info, FLOAT xrpow[576])
|
|
{
|
|
int l, j, sfb;
|
|
const FLOAT ifqstep34 = 1.29683955465100964055;
|
|
|
|
j = 0;
|
|
for (sfb = 0; sfb < cod_info->sfbmax; sfb++) {
|
|
int const width = cod_info->width[sfb];
|
|
int s = cod_info->scalefac[sfb];
|
|
if (cod_info->preflag)
|
|
s += pretab[sfb];
|
|
j += width;
|
|
if (s & 1) {
|
|
s++;
|
|
for (l = -width; l < 0; l++) {
|
|
xrpow[j + l] *= ifqstep34;
|
|
if (xrpow[j + l] > cod_info->xrpow_max)
|
|
cod_info->xrpow_max = xrpow[j + l];
|
|
}
|
|
}
|
|
cod_info->scalefac[sfb] = s >> 1;
|
|
}
|
|
cod_info->preflag = 0;
|
|
cod_info->scalefac_scale = 1;
|
|
}
|
|
|
|
|
|
|
|
/*************************************************************************
|
|
*
|
|
* inc_subblock_gain()
|
|
*
|
|
* Takehiro Tominaga 2000-xx-xx
|
|
*
|
|
* increases the subblock gain and adjusts scalefactors
|
|
*
|
|
*************************************************************************/
|
|
|
|
static int
|
|
inc_subblock_gain(const lame_internal_flags * const gfc, gr_info * const cod_info, FLOAT xrpow[576])
|
|
{
|
|
int sfb, window;
|
|
int *const scalefac = cod_info->scalefac;
|
|
|
|
/* subbloc_gain can't do anything in the long block region */
|
|
for (sfb = 0; sfb < cod_info->sfb_lmax; sfb++) {
|
|
if (scalefac[sfb] >= 16)
|
|
return 1;
|
|
}
|
|
|
|
for (window = 0; window < 3; window++) {
|
|
int s1, s2, l, j;
|
|
s1 = s2 = 0;
|
|
|
|
for (sfb = cod_info->sfb_lmax + window; sfb < cod_info->sfbdivide; sfb += 3) {
|
|
if (s1 < scalefac[sfb])
|
|
s1 = scalefac[sfb];
|
|
}
|
|
for (; sfb < cod_info->sfbmax; sfb += 3) {
|
|
if (s2 < scalefac[sfb])
|
|
s2 = scalefac[sfb];
|
|
}
|
|
|
|
if (s1 < 16 && s2 < 8)
|
|
continue;
|
|
|
|
if (cod_info->subblock_gain[window] >= 7)
|
|
return 1;
|
|
|
|
/* even though there is no scalefactor for sfb12
|
|
* subblock gain affects upper frequencies too, that's why
|
|
* we have to go up to SBMAX_s
|
|
*/
|
|
cod_info->subblock_gain[window]++;
|
|
j = gfc->scalefac_band.l[cod_info->sfb_lmax];
|
|
for (sfb = cod_info->sfb_lmax + window; sfb < cod_info->sfbmax; sfb += 3) {
|
|
FLOAT amp;
|
|
int const width = cod_info->width[sfb];
|
|
int s = scalefac[sfb];
|
|
assert(s >= 0);
|
|
s = s - (4 >> cod_info->scalefac_scale);
|
|
if (s >= 0) {
|
|
scalefac[sfb] = s;
|
|
j += width * 3;
|
|
continue;
|
|
}
|
|
|
|
scalefac[sfb] = 0;
|
|
{
|
|
int const gain = 210 + (s << (cod_info->scalefac_scale + 1));
|
|
amp = IPOW20(gain);
|
|
}
|
|
j += width * (window + 1);
|
|
for (l = -width; l < 0; l++) {
|
|
xrpow[j + l] *= amp;
|
|
if (xrpow[j + l] > cod_info->xrpow_max)
|
|
cod_info->xrpow_max = xrpow[j + l];
|
|
}
|
|
j += width * (3 - window - 1);
|
|
}
|
|
|
|
{
|
|
FLOAT const amp = IPOW20(202);
|
|
j += cod_info->width[sfb] * (window + 1);
|
|
for (l = -cod_info->width[sfb]; l < 0; l++) {
|
|
xrpow[j + l] *= amp;
|
|
if (xrpow[j + l] > cod_info->xrpow_max)
|
|
cod_info->xrpow_max = xrpow[j + l];
|
|
}
|
|
}
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
|
|
|
|
/********************************************************************
|
|
*
|
|
* balance_noise()
|
|
*
|
|
* Takehiro Tominaga /date??
|
|
* Robert Hegemann 2000-09-06: made a function of it
|
|
*
|
|
* amplifies scalefactor bands,
|
|
* - if all are already amplified returns 0
|
|
* - if some bands are amplified too much:
|
|
* * try to increase scalefac_scale
|
|
* * if already scalefac_scale was set
|
|
* try on short blocks to increase subblock gain
|
|
*
|
|
********************************************************************/
|
|
inline static int
|
|
balance_noise(lame_internal_flags * gfc,
|
|
gr_info * const cod_info, FLOAT const *distort, FLOAT xrpow[576], int bRefine)
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
int status;
|
|
|
|
amp_scalefac_bands(gfc, cod_info, distort, xrpow, bRefine);
|
|
|
|
/* check to make sure we have not amplified too much
|
|
* loop_break returns 0 if there is an unamplified scalefac
|
|
* scale_bitcount returns 0 if no scalefactors are too large
|
|
*/
|
|
|
|
status = loop_break(cod_info);
|
|
|
|
if (status)
|
|
return 0; /* all bands amplified */
|
|
|
|
/* not all scalefactors have been amplified. so these
|
|
* scalefacs are possibly valid. encode them:
|
|
*/
|
|
status = scale_bitcount(gfc, cod_info);
|
|
|
|
if (!status)
|
|
return 1; /* amplified some bands not exceeding limits */
|
|
|
|
/* some scalefactors are too large.
|
|
* lets try setting scalefac_scale=1
|
|
*/
|
|
if (cfg->noise_shaping > 1) {
|
|
memset(&gfc->sv_qnt.pseudohalf[0], 0, sizeof(gfc->sv_qnt.pseudohalf));
|
|
if (!cod_info->scalefac_scale) {
|
|
inc_scalefac_scale(cod_info, xrpow);
|
|
status = 0;
|
|
}
|
|
else {
|
|
if (cod_info->block_type == SHORT_TYPE && cfg->subblock_gain > 0) {
|
|
status = inc_subblock_gain(gfc, cod_info, xrpow)
|
|
|| loop_break(cod_info);
|
|
}
|
|
}
|
|
}
|
|
|
|
if (!status) {
|
|
status = scale_bitcount(gfc, cod_info);
|
|
}
|
|
return !status;
|
|
}
|
|
|
|
|
|
|
|
/************************************************************************
|
|
*
|
|
* outer_loop ()
|
|
*
|
|
* Function: The outer iteration loop controls the masking conditions
|
|
* of all scalefactorbands. It computes the best scalefac and
|
|
* global gain. This module calls the inner iteration loop
|
|
*
|
|
* mt 5/99 completely rewritten to allow for bit reservoir control,
|
|
* mid/side channels with L/R or mid/side masking thresholds,
|
|
* and chooses best quantization instead of last quantization when
|
|
* no distortion free quantization can be found.
|
|
*
|
|
* added VBR support mt 5/99
|
|
*
|
|
* some code shuffle rh 9/00
|
|
************************************************************************/
|
|
|
|
static int
|
|
outer_loop(lame_internal_flags * gfc, gr_info * const cod_info, const FLOAT * const l3_xmin, /* allowed distortion */
|
|
FLOAT xrpow[576], /* coloured magnitudes of spectral */
|
|
const int ch, const int targ_bits)
|
|
{ /* maximum allowed bits */
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
gr_info cod_info_w;
|
|
FLOAT save_xrpow[576];
|
|
FLOAT distort[SFBMAX];
|
|
calc_noise_result best_noise_info;
|
|
int huff_bits;
|
|
int better;
|
|
int age;
|
|
calc_noise_data prev_noise;
|
|
int best_part2_3_length = 9999999;
|
|
int bEndOfSearch = 0;
|
|
int bRefine = 0;
|
|
int best_ggain_pass1 = 0;
|
|
|
|
(void) bin_search_StepSize(gfc, cod_info, targ_bits, ch, xrpow);
|
|
|
|
if (!cfg->noise_shaping)
|
|
/* fast mode, no noise shaping, we are ready */
|
|
return 100; /* default noise_info.over_count */
|
|
|
|
memset(&prev_noise, 0, sizeof(calc_noise_data));
|
|
|
|
|
|
/* compute the distortion in this quantization */
|
|
/* coefficients and thresholds both l/r (or both mid/side) */
|
|
(void) calc_noise(cod_info, l3_xmin, distort, &best_noise_info, &prev_noise);
|
|
best_noise_info.bits = cod_info->part2_3_length;
|
|
|
|
cod_info_w = *cod_info;
|
|
age = 0;
|
|
/* if (cfg->vbr == vbr_rh || cfg->vbr == vbr_mtrh) */
|
|
memcpy(save_xrpow, xrpow, sizeof(FLOAT) * 576);
|
|
|
|
while (!bEndOfSearch) {
|
|
/* BEGIN MAIN LOOP */
|
|
do {
|
|
calc_noise_result noise_info;
|
|
int search_limit;
|
|
int maxggain = 255;
|
|
|
|
/* When quantization with no distorted bands is found,
|
|
* allow up to X new unsuccesful tries in serial. This
|
|
* gives us more possibilities for different quant_compare modes.
|
|
* Much more than 3 makes not a big difference, it is only slower.
|
|
*/
|
|
|
|
if (gfc->sv_qnt.substep_shaping & 2) {
|
|
search_limit = 20;
|
|
}
|
|
else {
|
|
search_limit = 3;
|
|
}
|
|
|
|
|
|
|
|
/* Check if the last scalefactor band is distorted.
|
|
* in VBR mode we can't get rid of the distortion, so quit now
|
|
* and VBR mode will try again with more bits.
|
|
* (makes a 10% speed increase, the files I tested were
|
|
* binary identical, 2000/05/20 Robert Hegemann)
|
|
* distort[] > 1 means noise > allowed noise
|
|
*/
|
|
if (gfc->sv_qnt.sfb21_extra) {
|
|
if (distort[cod_info_w.sfbmax] > 1.0)
|
|
break;
|
|
if (cod_info_w.block_type == SHORT_TYPE
|
|
&& (distort[cod_info_w.sfbmax + 1] > 1.0
|
|
|| distort[cod_info_w.sfbmax + 2] > 1.0))
|
|
break;
|
|
}
|
|
|
|
/* try a new scalefactor conbination on cod_info_w */
|
|
if (balance_noise(gfc, &cod_info_w, distort, xrpow, bRefine) == 0)
|
|
break;
|
|
if (cod_info_w.scalefac_scale)
|
|
maxggain = 254;
|
|
|
|
/* inner_loop starts with the initial quantization step computed above
|
|
* and slowly increases until the bits < huff_bits.
|
|
* Thus it is important not to start with too large of an inital
|
|
* quantization step. Too small is ok, but inner_loop will take longer
|
|
*/
|
|
huff_bits = targ_bits - cod_info_w.part2_length;
|
|
if (huff_bits <= 0)
|
|
break;
|
|
|
|
/* increase quantizer stepsize until needed bits are below maximum
|
|
*/
|
|
while ((cod_info_w.part2_3_length
|
|
= count_bits(gfc, xrpow, &cod_info_w, &prev_noise)) > huff_bits
|
|
&& cod_info_w.global_gain <= maxggain)
|
|
cod_info_w.global_gain++;
|
|
|
|
if (cod_info_w.global_gain > maxggain)
|
|
break;
|
|
|
|
if (best_noise_info.over_count == 0) {
|
|
|
|
while ((cod_info_w.part2_3_length
|
|
= count_bits(gfc, xrpow, &cod_info_w, &prev_noise)) > best_part2_3_length
|
|
&& cod_info_w.global_gain <= maxggain)
|
|
cod_info_w.global_gain++;
|
|
|
|
if (cod_info_w.global_gain > maxggain)
|
|
break;
|
|
}
|
|
|
|
/* compute the distortion in this quantization */
|
|
(void) calc_noise(&cod_info_w, l3_xmin, distort, &noise_info, &prev_noise);
|
|
noise_info.bits = cod_info_w.part2_3_length;
|
|
|
|
/* check if this quantization is better
|
|
* than our saved quantization */
|
|
if (cod_info->block_type != SHORT_TYPE) /* NORM, START or STOP type */
|
|
better = cfg->quant_comp;
|
|
else
|
|
better = cfg->quant_comp_short;
|
|
|
|
|
|
better = quant_compare(better, &best_noise_info, &noise_info, &cod_info_w, distort);
|
|
|
|
|
|
/* save data so we can restore this quantization later */
|
|
if (better) {
|
|
best_part2_3_length = cod_info->part2_3_length;
|
|
best_noise_info = noise_info;
|
|
*cod_info = cod_info_w;
|
|
age = 0;
|
|
/* save data so we can restore this quantization later */
|
|
/*if (cfg->vbr == vbr_rh || cfg->vbr == vbr_mtrh) */ {
|
|
/* store for later reuse */
|
|
memcpy(save_xrpow, xrpow, sizeof(FLOAT) * 576);
|
|
}
|
|
}
|
|
else {
|
|
/* early stop? */
|
|
if (cfg->full_outer_loop == 0) {
|
|
if (++age > search_limit && best_noise_info.over_count == 0)
|
|
break;
|
|
if ((cfg->noise_shaping_amp == 3) && bRefine && age > 30)
|
|
break;
|
|
if ((cfg->noise_shaping_amp == 3) && bRefine &&
|
|
(cod_info_w.global_gain - best_ggain_pass1) > 15)
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
while ((cod_info_w.global_gain + cod_info_w.scalefac_scale) < 255);
|
|
|
|
if (cfg->noise_shaping_amp == 3) {
|
|
if (!bRefine) {
|
|
/* refine search */
|
|
cod_info_w = *cod_info;
|
|
memcpy(xrpow, save_xrpow, sizeof(FLOAT) * 576);
|
|
age = 0;
|
|
best_ggain_pass1 = cod_info_w.global_gain;
|
|
|
|
bRefine = 1;
|
|
}
|
|
else {
|
|
/* search already refined, stop */
|
|
bEndOfSearch = 1;
|
|
}
|
|
|
|
}
|
|
else {
|
|
bEndOfSearch = 1;
|
|
}
|
|
}
|
|
|
|
assert((cod_info->global_gain + cod_info->scalefac_scale) <= 255);
|
|
/* finish up
|
|
*/
|
|
if (cfg->vbr == vbr_rh || cfg->vbr == vbr_mtrh || cfg->vbr == vbr_mt)
|
|
/* restore for reuse on next try */
|
|
memcpy(xrpow, save_xrpow, sizeof(FLOAT) * 576);
|
|
/* do the 'substep shaping'
|
|
*/
|
|
else if (gfc->sv_qnt.substep_shaping & 1)
|
|
trancate_smallspectrums(gfc, cod_info, l3_xmin, xrpow);
|
|
|
|
return best_noise_info.over_count;
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/************************************************************************
|
|
*
|
|
* iteration_finish_one()
|
|
*
|
|
* Robert Hegemann 2000-09-06
|
|
*
|
|
* update reservoir status after FINAL quantization/bitrate
|
|
*
|
|
************************************************************************/
|
|
|
|
static void
|
|
iteration_finish_one(lame_internal_flags * gfc, int gr, int ch)
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
III_side_info_t *const l3_side = &gfc->l3_side;
|
|
gr_info *const cod_info = &l3_side->tt[gr][ch];
|
|
|
|
/* try some better scalefac storage
|
|
*/
|
|
best_scalefac_store(gfc, gr, ch, l3_side);
|
|
|
|
/* best huffman_divide may save some bits too
|
|
*/
|
|
if (cfg->use_best_huffman == 1)
|
|
best_huffman_divide(gfc, cod_info);
|
|
|
|
/* update reservoir status after FINAL quantization/bitrate
|
|
*/
|
|
ResvAdjust(gfc, cod_info);
|
|
}
|
|
|
|
|
|
|
|
/*********************************************************************
|
|
*
|
|
* VBR_encode_granule()
|
|
*
|
|
* 2000-09-04 Robert Hegemann
|
|
*
|
|
*********************************************************************/
|
|
|
|
static void
|
|
VBR_encode_granule(lame_internal_flags * gfc, gr_info * const cod_info, const FLOAT * const l3_xmin, /* allowed distortion of the scalefactor */
|
|
FLOAT xrpow[576], /* coloured magnitudes of spectral values */
|
|
const int ch, int min_bits, int max_bits)
|
|
{
|
|
gr_info bst_cod_info;
|
|
FLOAT bst_xrpow[576];
|
|
int const Max_bits = max_bits;
|
|
int real_bits = max_bits + 1;
|
|
int this_bits = (max_bits + min_bits) / 2;
|
|
int dbits, over, found = 0;
|
|
int const sfb21_extra = gfc->sv_qnt.sfb21_extra;
|
|
|
|
assert(Max_bits <= MAX_BITS_PER_CHANNEL);
|
|
memset(bst_cod_info.l3_enc, 0, sizeof(bst_cod_info.l3_enc));
|
|
|
|
/* search within round about 40 bits of optimal
|
|
*/
|
|
do {
|
|
assert(this_bits >= min_bits);
|
|
assert(this_bits <= max_bits);
|
|
assert(min_bits <= max_bits);
|
|
|
|
if (this_bits > Max_bits - 42)
|
|
gfc->sv_qnt.sfb21_extra = 0;
|
|
else
|
|
gfc->sv_qnt.sfb21_extra = sfb21_extra;
|
|
|
|
over = outer_loop(gfc, cod_info, l3_xmin, xrpow, ch, this_bits);
|
|
|
|
/* is quantization as good as we are looking for ?
|
|
* in this case: is no scalefactor band distorted?
|
|
*/
|
|
if (over <= 0) {
|
|
found = 1;
|
|
/* now we know it can be done with "real_bits"
|
|
* and maybe we can skip some iterations
|
|
*/
|
|
real_bits = cod_info->part2_3_length;
|
|
|
|
/* store best quantization so far
|
|
*/
|
|
bst_cod_info = *cod_info;
|
|
memcpy(bst_xrpow, xrpow, sizeof(FLOAT) * 576);
|
|
|
|
/* try with fewer bits
|
|
*/
|
|
max_bits = real_bits - 32;
|
|
dbits = max_bits - min_bits;
|
|
this_bits = (max_bits + min_bits) / 2;
|
|
}
|
|
else {
|
|
/* try with more bits
|
|
*/
|
|
min_bits = this_bits + 32;
|
|
dbits = max_bits - min_bits;
|
|
this_bits = (max_bits + min_bits) / 2;
|
|
|
|
if (found) {
|
|
found = 2;
|
|
/* start again with best quantization so far
|
|
*/
|
|
*cod_info = bst_cod_info;
|
|
memcpy(xrpow, bst_xrpow, sizeof(FLOAT) * 576);
|
|
}
|
|
}
|
|
} while (dbits > 12);
|
|
|
|
gfc->sv_qnt.sfb21_extra = sfb21_extra;
|
|
|
|
/* found=0 => nothing found, use last one
|
|
* found=1 => we just found the best and left the loop
|
|
* found=2 => we restored a good one and have now l3_enc to restore too
|
|
*/
|
|
if (found == 2) {
|
|
memcpy(cod_info->l3_enc, bst_cod_info.l3_enc, sizeof(int) * 576);
|
|
}
|
|
assert(cod_info->part2_3_length <= Max_bits);
|
|
|
|
}
|
|
|
|
|
|
|
|
/************************************************************************
|
|
*
|
|
* get_framebits()
|
|
*
|
|
* Robert Hegemann 2000-09-05
|
|
*
|
|
* calculates
|
|
* * how many bits are available for analog silent granules
|
|
* * how many bits to use for the lowest allowed bitrate
|
|
* * how many bits each bitrate would provide
|
|
*
|
|
************************************************************************/
|
|
|
|
static void
|
|
get_framebits(lame_internal_flags * gfc, int frameBits[15])
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
EncResult_t *const eov = &gfc->ov_enc;
|
|
int bitsPerFrame, i;
|
|
|
|
/* always use at least this many bits per granule per channel
|
|
* unless we detect analog silence, see below
|
|
*/
|
|
eov->bitrate_index = cfg->vbr_min_bitrate_index;
|
|
bitsPerFrame = getframebits(gfc);
|
|
|
|
/* bits for analog silence
|
|
*/
|
|
eov->bitrate_index = 1;
|
|
bitsPerFrame = getframebits(gfc);
|
|
|
|
for (i = 1; i <= cfg->vbr_max_bitrate_index; i++) {
|
|
eov->bitrate_index = i;
|
|
frameBits[i] = ResvFrameBegin(gfc, &bitsPerFrame);
|
|
}
|
|
}
|
|
|
|
|
|
|
|
/*********************************************************************
|
|
*
|
|
* VBR_old_prepare()
|
|
*
|
|
* 2000-09-04 Robert Hegemann
|
|
*
|
|
* * converts LR to MS coding when necessary
|
|
* * calculates allowed/adjusted quantization noise amounts
|
|
* * detects analog silent frames
|
|
*
|
|
* some remarks:
|
|
* - lower masking depending on Quality setting
|
|
* - quality control together with adjusted ATH MDCT scaling
|
|
* on lower quality setting allocate more noise from
|
|
* ATH masking, and on higher quality setting allocate
|
|
* less noise from ATH masking.
|
|
* - experiments show that going more than 2dB over GPSYCHO's
|
|
* limits ends up in very annoying artefacts
|
|
*
|
|
*********************************************************************/
|
|
|
|
/* RH: this one needs to be overhauled sometime */
|
|
|
|
static int
|
|
VBR_old_prepare(lame_internal_flags * gfc,
|
|
const FLOAT pe[2][2], FLOAT const ms_ener_ratio[2],
|
|
const III_psy_ratio ratio[2][2],
|
|
FLOAT l3_xmin[2][2][SFBMAX],
|
|
int frameBits[16], int min_bits[2][2], int max_bits[2][2], int bands[2][2])
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
EncResult_t *const eov = &gfc->ov_enc;
|
|
|
|
FLOAT masking_lower_db, adjust = 0.0;
|
|
int gr, ch;
|
|
int analog_silence = 1;
|
|
int avg, mxb, bits = 0;
|
|
|
|
eov->bitrate_index = cfg->vbr_max_bitrate_index;
|
|
avg = ResvFrameBegin(gfc, &avg) / cfg->mode_gr;
|
|
|
|
get_framebits(gfc, frameBits);
|
|
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
mxb = on_pe(gfc, pe, max_bits[gr], avg, gr, 0);
|
|
if (gfc->ov_enc.mode_ext == MPG_MD_MS_LR) {
|
|
ms_convert(&gfc->l3_side, gr);
|
|
reduce_side(max_bits[gr], ms_ener_ratio[gr], avg, mxb);
|
|
}
|
|
for (ch = 0; ch < cfg->channels_out; ++ch) {
|
|
gr_info *const cod_info = &gfc->l3_side.tt[gr][ch];
|
|
|
|
if (cod_info->block_type != SHORT_TYPE) { /* NORM, START or STOP type */
|
|
adjust = 1.28 / (1 + exp(3.5 - pe[gr][ch] / 300.)) - 0.05;
|
|
masking_lower_db = gfc->sv_qnt.mask_adjust - adjust;
|
|
}
|
|
else {
|
|
adjust = 2.56 / (1 + exp(3.5 - pe[gr][ch] / 300.)) - 0.14;
|
|
masking_lower_db = gfc->sv_qnt.mask_adjust_short - adjust;
|
|
}
|
|
gfc->sv_qnt.masking_lower = pow(10.0, masking_lower_db * 0.1);
|
|
|
|
init_outer_loop(gfc, cod_info);
|
|
bands[gr][ch] = calc_xmin(gfc, &ratio[gr][ch], cod_info, l3_xmin[gr][ch]);
|
|
if (bands[gr][ch])
|
|
analog_silence = 0;
|
|
|
|
min_bits[gr][ch] = 126;
|
|
|
|
bits += max_bits[gr][ch];
|
|
}
|
|
}
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
if (bits > frameBits[cfg->vbr_max_bitrate_index] && bits > 0) {
|
|
max_bits[gr][ch] *= frameBits[cfg->vbr_max_bitrate_index];
|
|
max_bits[gr][ch] /= bits;
|
|
}
|
|
if (min_bits[gr][ch] > max_bits[gr][ch])
|
|
min_bits[gr][ch] = max_bits[gr][ch];
|
|
|
|
} /* for ch */
|
|
} /* for gr */
|
|
|
|
return analog_silence;
|
|
}
|
|
|
|
static void
|
|
bitpressure_strategy(lame_internal_flags const *gfc,
|
|
FLOAT l3_xmin[2][2][SFBMAX], const int min_bits[2][2], int max_bits[2][2])
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
int gr, ch, sfb;
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
gr_info const *const gi = &gfc->l3_side.tt[gr][ch];
|
|
FLOAT *pxmin = l3_xmin[gr][ch];
|
|
for (sfb = 0; sfb < gi->psy_lmax; sfb++)
|
|
*pxmin++ *= 1. + .029 * sfb * sfb / SBMAX_l / SBMAX_l;
|
|
|
|
if (gi->block_type == SHORT_TYPE) {
|
|
for (sfb = gi->sfb_smin; sfb < SBMAX_s; sfb++) {
|
|
*pxmin++ *= 1. + .029 * sfb * sfb / SBMAX_s / SBMAX_s;
|
|
*pxmin++ *= 1. + .029 * sfb * sfb / SBMAX_s / SBMAX_s;
|
|
*pxmin++ *= 1. + .029 * sfb * sfb / SBMAX_s / SBMAX_s;
|
|
}
|
|
}
|
|
max_bits[gr][ch] = Max(min_bits[gr][ch], 0.9 * max_bits[gr][ch]);
|
|
}
|
|
}
|
|
}
|
|
|
|
/************************************************************************
|
|
*
|
|
* VBR_old_iteration_loop()
|
|
*
|
|
* tries to find out how many bits are needed for each granule and channel
|
|
* to get an acceptable quantization. An appropriate bitrate will then be
|
|
* chosen for quantization. rh 8/99
|
|
*
|
|
* Robert Hegemann 2000-09-06 rewrite
|
|
*
|
|
************************************************************************/
|
|
|
|
void
|
|
VBR_old_iteration_loop(lame_internal_flags * gfc, const FLOAT pe[2][2],
|
|
const FLOAT ms_ener_ratio[2], const III_psy_ratio ratio[2][2])
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
EncResult_t *const eov = &gfc->ov_enc;
|
|
FLOAT l3_xmin[2][2][SFBMAX];
|
|
|
|
FLOAT xrpow[576];
|
|
int bands[2][2];
|
|
int frameBits[15];
|
|
int used_bits;
|
|
int bits;
|
|
int min_bits[2][2], max_bits[2][2];
|
|
int mean_bits;
|
|
int ch, gr, analog_silence;
|
|
III_side_info_t *const l3_side = &gfc->l3_side;
|
|
|
|
analog_silence = VBR_old_prepare(gfc, pe, ms_ener_ratio, ratio,
|
|
l3_xmin, frameBits, min_bits, max_bits, bands);
|
|
|
|
/*---------------------------------*/
|
|
for (;;) {
|
|
|
|
/* quantize granules with lowest possible number of bits
|
|
*/
|
|
|
|
used_bits = 0;
|
|
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
int ret;
|
|
gr_info *const cod_info = &l3_side->tt[gr][ch];
|
|
|
|
/* init_outer_loop sets up cod_info, scalefac and xrpow
|
|
*/
|
|
ret = init_xrpow(gfc, cod_info, xrpow);
|
|
if (ret == 0 || max_bits[gr][ch] == 0) {
|
|
/* xr contains no energy
|
|
* l3_enc, our encoding data, will be quantized to zero
|
|
*/
|
|
continue; /* with next channel */
|
|
}
|
|
|
|
VBR_encode_granule(gfc, cod_info, l3_xmin[gr][ch], xrpow,
|
|
ch, min_bits[gr][ch], max_bits[gr][ch]);
|
|
|
|
/* do the 'substep shaping'
|
|
*/
|
|
if (gfc->sv_qnt.substep_shaping & 1) {
|
|
trancate_smallspectrums(gfc, &l3_side->tt[gr][ch], l3_xmin[gr][ch], xrpow);
|
|
}
|
|
|
|
ret = cod_info->part2_3_length + cod_info->part2_length;
|
|
used_bits += ret;
|
|
} /* for ch */
|
|
} /* for gr */
|
|
|
|
/* find lowest bitrate able to hold used bits
|
|
*/
|
|
if (analog_silence && !cfg->enforce_min_bitrate)
|
|
/* we detected analog silence and the user did not specify
|
|
* any hard framesize limit, so start with smallest possible frame
|
|
*/
|
|
eov->bitrate_index = 1;
|
|
else
|
|
eov->bitrate_index = cfg->vbr_min_bitrate_index;
|
|
|
|
for (; eov->bitrate_index < cfg->vbr_max_bitrate_index; eov->bitrate_index++) {
|
|
if (used_bits <= frameBits[eov->bitrate_index])
|
|
break;
|
|
}
|
|
bits = ResvFrameBegin(gfc, &mean_bits);
|
|
|
|
if (used_bits <= bits)
|
|
break;
|
|
|
|
bitpressure_strategy(gfc, l3_xmin, (const int (*)[2])min_bits, max_bits);
|
|
|
|
} /* breaks adjusted */
|
|
/*--------------------------------------*/
|
|
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
iteration_finish_one(gfc, gr, ch);
|
|
} /* for ch */
|
|
} /* for gr */
|
|
ResvFrameEnd(gfc, mean_bits);
|
|
}
|
|
|
|
|
|
|
|
static int
|
|
VBR_new_prepare(lame_internal_flags * gfc,
|
|
const FLOAT pe[2][2], const III_psy_ratio ratio[2][2],
|
|
FLOAT l3_xmin[2][2][SFBMAX], int frameBits[16], int max_bits[2][2],
|
|
int* max_resv)
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
EncResult_t *const eov = &gfc->ov_enc;
|
|
|
|
int gr, ch;
|
|
int analog_silence = 1;
|
|
int avg, bits = 0;
|
|
int maximum_framebits;
|
|
|
|
if (!cfg->free_format) {
|
|
eov->bitrate_index = cfg->vbr_max_bitrate_index;
|
|
(void) ResvFrameBegin(gfc, &avg);
|
|
*max_resv = gfc->sv_enc.ResvMax;
|
|
|
|
get_framebits(gfc, frameBits);
|
|
maximum_framebits = frameBits[cfg->vbr_max_bitrate_index];
|
|
}
|
|
else {
|
|
eov->bitrate_index = 0;
|
|
maximum_framebits = ResvFrameBegin(gfc, &avg);
|
|
frameBits[0] = maximum_framebits;
|
|
*max_resv = gfc->sv_enc.ResvMax;
|
|
}
|
|
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
(void) on_pe(gfc, pe, max_bits[gr], avg, gr, 0);
|
|
if (gfc->ov_enc.mode_ext == MPG_MD_MS_LR) {
|
|
ms_convert(&gfc->l3_side, gr);
|
|
}
|
|
for (ch = 0; ch < cfg->channels_out; ++ch) {
|
|
gr_info *const cod_info = &gfc->l3_side.tt[gr][ch];
|
|
|
|
gfc->sv_qnt.masking_lower = pow(10.0, gfc->sv_qnt.mask_adjust * 0.1);
|
|
|
|
init_outer_loop(gfc, cod_info);
|
|
if (0 != calc_xmin(gfc, &ratio[gr][ch], cod_info, l3_xmin[gr][ch]))
|
|
analog_silence = 0;
|
|
|
|
bits += max_bits[gr][ch];
|
|
}
|
|
}
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
if (bits > maximum_framebits && bits > 0) {
|
|
max_bits[gr][ch] *= maximum_framebits;
|
|
max_bits[gr][ch] /= bits;
|
|
}
|
|
|
|
} /* for ch */
|
|
} /* for gr */
|
|
if (analog_silence) {
|
|
*max_resv = 0;
|
|
}
|
|
return analog_silence;
|
|
}
|
|
|
|
|
|
|
|
void
|
|
VBR_new_iteration_loop(lame_internal_flags * gfc, const FLOAT pe[2][2],
|
|
const FLOAT ms_ener_ratio[2], const III_psy_ratio ratio[2][2])
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
EncResult_t *const eov = &gfc->ov_enc;
|
|
FLOAT l3_xmin[2][2][SFBMAX];
|
|
|
|
FLOAT xrpow[2][2][576];
|
|
int frameBits[15];
|
|
int used_bits;
|
|
int max_bits[2][2];
|
|
int ch, gr, analog_silence, pad;
|
|
III_side_info_t *const l3_side = &gfc->l3_side;
|
|
|
|
const FLOAT (*const_l3_xmin)[2][SFBMAX] = (const FLOAT (*)[2][SFBMAX])l3_xmin;
|
|
const FLOAT (*const_xrpow)[2][576] = (const FLOAT (*)[2][576])xrpow;
|
|
const int (*const_max_bits)[2] = (const int (*)[2])max_bits;
|
|
|
|
(void) ms_ener_ratio; /* not used */
|
|
|
|
memset(xrpow, 0, sizeof(xrpow));
|
|
|
|
analog_silence = VBR_new_prepare(gfc, pe, ratio, l3_xmin, frameBits, max_bits, &pad);
|
|
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
gr_info *const cod_info = &l3_side->tt[gr][ch];
|
|
|
|
/* init_outer_loop sets up cod_info, scalefac and xrpow
|
|
*/
|
|
if (0 == init_xrpow(gfc, cod_info, xrpow[gr][ch])) {
|
|
max_bits[gr][ch] = 0; /* silent granule needs no bits */
|
|
}
|
|
} /* for ch */
|
|
} /* for gr */
|
|
|
|
/* quantize granules with lowest possible number of bits
|
|
*/
|
|
|
|
used_bits = VBR_encode_frame(gfc, const_xrpow, const_l3_xmin, const_max_bits);
|
|
|
|
if (!cfg->free_format) {
|
|
int i, j;
|
|
|
|
/* find lowest bitrate able to hold used bits
|
|
*/
|
|
if (analog_silence && !cfg->enforce_min_bitrate) {
|
|
/* we detected analog silence and the user did not specify
|
|
* any hard framesize limit, so start with smallest possible frame
|
|
*/
|
|
i = 1;
|
|
}
|
|
else {
|
|
i = cfg->vbr_min_bitrate_index;
|
|
}
|
|
|
|
for (; i < cfg->vbr_max_bitrate_index; i++) {
|
|
if (used_bits <= frameBits[i])
|
|
break;
|
|
}
|
|
if (i > cfg->vbr_max_bitrate_index) {
|
|
i = cfg->vbr_max_bitrate_index;
|
|
}
|
|
if (pad > 0) {
|
|
for (j = cfg->vbr_max_bitrate_index; j > i; --j) {
|
|
int const unused = frameBits[j] - used_bits;
|
|
if (unused <= pad)
|
|
break;
|
|
}
|
|
eov->bitrate_index = j;
|
|
}
|
|
else {
|
|
eov->bitrate_index = i;
|
|
}
|
|
}
|
|
else {
|
|
#if 0
|
|
static int mmm = 0;
|
|
int fff = getFramesize_kbps(gfc, used_bits);
|
|
int hhh = getFramesize_kbps(gfc, MAX_BITS_PER_GRANULE * cfg->mode_gr);
|
|
if (mmm < fff)
|
|
mmm = fff;
|
|
printf("demand=%3d kbps max=%3d kbps limit=%3d kbps\n", fff, mmm, hhh);
|
|
#endif
|
|
eov->bitrate_index = 0;
|
|
}
|
|
if (used_bits <= frameBits[eov->bitrate_index]) {
|
|
/* update Reservoire status */
|
|
int mean_bits, fullframebits;
|
|
fullframebits = ResvFrameBegin(gfc, &mean_bits);
|
|
assert(used_bits <= fullframebits);
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
gr_info const *const cod_info = &l3_side->tt[gr][ch];
|
|
ResvAdjust(gfc, cod_info);
|
|
}
|
|
}
|
|
ResvFrameEnd(gfc, mean_bits);
|
|
}
|
|
else {
|
|
/* SHOULD NOT HAPPEN INTERNAL ERROR
|
|
*/
|
|
ERRORF(gfc, "INTERNAL ERROR IN VBR NEW CODE, please send bug report\n");
|
|
exit(-1);
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/********************************************************************
|
|
*
|
|
* calc_target_bits()
|
|
*
|
|
* calculates target bits for ABR encoding
|
|
*
|
|
* mt 2000/05/31
|
|
*
|
|
********************************************************************/
|
|
|
|
static void
|
|
calc_target_bits(lame_internal_flags * gfc,
|
|
const FLOAT pe[2][2],
|
|
FLOAT const ms_ener_ratio[2],
|
|
int targ_bits[2][2], int *analog_silence_bits, int *max_frame_bits)
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
EncResult_t *const eov = &gfc->ov_enc;
|
|
III_side_info_t const *const l3_side = &gfc->l3_side;
|
|
FLOAT res_factor;
|
|
int gr, ch, totbits, mean_bits;
|
|
int framesize = 576 * cfg->mode_gr;
|
|
|
|
eov->bitrate_index = cfg->vbr_max_bitrate_index;
|
|
*max_frame_bits = ResvFrameBegin(gfc, &mean_bits);
|
|
|
|
eov->bitrate_index = 1;
|
|
mean_bits = getframebits(gfc) - cfg->sideinfo_len * 8;
|
|
*analog_silence_bits = mean_bits / (cfg->mode_gr * cfg->channels_out);
|
|
|
|
mean_bits = cfg->vbr_avg_bitrate_kbps * framesize * 1000;
|
|
if (gfc->sv_qnt.substep_shaping & 1)
|
|
mean_bits *= 1.09;
|
|
mean_bits /= cfg->samplerate_out;
|
|
mean_bits -= cfg->sideinfo_len * 8;
|
|
mean_bits /= (cfg->mode_gr * cfg->channels_out);
|
|
|
|
/*
|
|
res_factor is the percentage of the target bitrate that should
|
|
be used on average. the remaining bits are added to the
|
|
bitreservoir and used for difficult to encode frames.
|
|
|
|
Since we are tracking the average bitrate, we should adjust
|
|
res_factor "on the fly", increasing it if the average bitrate
|
|
is greater than the requested bitrate, and decreasing it
|
|
otherwise. Reasonable ranges are from .9 to 1.0
|
|
|
|
Until we get the above suggestion working, we use the following
|
|
tuning:
|
|
compression ratio res_factor
|
|
5.5 (256kbps) 1.0 no need for bitreservoir
|
|
11 (128kbps) .93 7% held for reservoir
|
|
|
|
with linear interpolation for other values.
|
|
|
|
*/
|
|
res_factor = .93 + .07 * (11.0 - cfg->compression_ratio) / (11.0 - 5.5);
|
|
if (res_factor < .90)
|
|
res_factor = .90;
|
|
if (res_factor > 1.00)
|
|
res_factor = 1.00;
|
|
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
int sum = 0;
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
targ_bits[gr][ch] = res_factor * mean_bits;
|
|
|
|
if (pe[gr][ch] > 700) {
|
|
int add_bits = (pe[gr][ch] - 700) / 1.4;
|
|
|
|
gr_info const *const cod_info = &l3_side->tt[gr][ch];
|
|
targ_bits[gr][ch] = res_factor * mean_bits;
|
|
|
|
/* short blocks use a little extra, no matter what the pe */
|
|
if (cod_info->block_type == SHORT_TYPE) {
|
|
if (add_bits < mean_bits / 2)
|
|
add_bits = mean_bits / 2;
|
|
}
|
|
/* at most increase bits by 1.5*average */
|
|
if (add_bits > mean_bits * 3 / 2)
|
|
add_bits = mean_bits * 3 / 2;
|
|
else if (add_bits < 0)
|
|
add_bits = 0;
|
|
|
|
targ_bits[gr][ch] += add_bits;
|
|
}
|
|
if (targ_bits[gr][ch] > MAX_BITS_PER_CHANNEL) {
|
|
targ_bits[gr][ch] = MAX_BITS_PER_CHANNEL;
|
|
}
|
|
sum += targ_bits[gr][ch];
|
|
} /* for ch */
|
|
if (sum > MAX_BITS_PER_GRANULE) {
|
|
for (ch = 0; ch < cfg->channels_out; ++ch) {
|
|
targ_bits[gr][ch] *= MAX_BITS_PER_GRANULE;
|
|
targ_bits[gr][ch] /= sum;
|
|
}
|
|
}
|
|
} /* for gr */
|
|
|
|
if (gfc->ov_enc.mode_ext == MPG_MD_MS_LR)
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
reduce_side(targ_bits[gr], ms_ener_ratio[gr], mean_bits * cfg->channels_out,
|
|
MAX_BITS_PER_GRANULE);
|
|
}
|
|
|
|
/* sum target bits
|
|
*/
|
|
totbits = 0;
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
if (targ_bits[gr][ch] > MAX_BITS_PER_CHANNEL)
|
|
targ_bits[gr][ch] = MAX_BITS_PER_CHANNEL;
|
|
totbits += targ_bits[gr][ch];
|
|
}
|
|
}
|
|
|
|
/* repartion target bits if needed
|
|
*/
|
|
if (totbits > *max_frame_bits && totbits > 0) {
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
targ_bits[gr][ch] *= *max_frame_bits;
|
|
targ_bits[gr][ch] /= totbits;
|
|
}
|
|
}
|
|
}
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/********************************************************************
|
|
*
|
|
* ABR_iteration_loop()
|
|
*
|
|
* encode a frame with a desired average bitrate
|
|
*
|
|
* mt 2000/05/31
|
|
*
|
|
********************************************************************/
|
|
|
|
void
|
|
ABR_iteration_loop(lame_internal_flags * gfc, const FLOAT pe[2][2],
|
|
const FLOAT ms_ener_ratio[2], const III_psy_ratio ratio[2][2])
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
EncResult_t *const eov = &gfc->ov_enc;
|
|
FLOAT l3_xmin[SFBMAX];
|
|
FLOAT xrpow[576];
|
|
int targ_bits[2][2];
|
|
int mean_bits, max_frame_bits;
|
|
int ch, gr, ath_over;
|
|
int analog_silence_bits;
|
|
gr_info *cod_info;
|
|
III_side_info_t *const l3_side = &gfc->l3_side;
|
|
|
|
mean_bits = 0;
|
|
|
|
calc_target_bits(gfc, pe, ms_ener_ratio, targ_bits, &analog_silence_bits, &max_frame_bits);
|
|
|
|
/* encode granules
|
|
*/
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
|
|
if (gfc->ov_enc.mode_ext == MPG_MD_MS_LR) {
|
|
ms_convert(&gfc->l3_side, gr);
|
|
}
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
FLOAT adjust, masking_lower_db;
|
|
cod_info = &l3_side->tt[gr][ch];
|
|
|
|
if (cod_info->block_type != SHORT_TYPE) { /* NORM, START or STOP type */
|
|
/* adjust = 1.28/(1+exp(3.5-pe[gr][ch]/300.))-0.05; */
|
|
adjust = 0;
|
|
masking_lower_db = gfc->sv_qnt.mask_adjust - adjust;
|
|
}
|
|
else {
|
|
/* adjust = 2.56/(1+exp(3.5-pe[gr][ch]/300.))-0.14; */
|
|
adjust = 0;
|
|
masking_lower_db = gfc->sv_qnt.mask_adjust_short - adjust;
|
|
}
|
|
gfc->sv_qnt.masking_lower = pow(10.0, masking_lower_db * 0.1);
|
|
|
|
|
|
/* cod_info, scalefac and xrpow get initialized in init_outer_loop
|
|
*/
|
|
init_outer_loop(gfc, cod_info);
|
|
if (init_xrpow(gfc, cod_info, xrpow)) {
|
|
/* xr contains energy we will have to encode
|
|
* calculate the masking abilities
|
|
* find some good quantization in outer_loop
|
|
*/
|
|
ath_over = calc_xmin(gfc, &ratio[gr][ch], cod_info, l3_xmin);
|
|
if (0 == ath_over) /* analog silence */
|
|
targ_bits[gr][ch] = analog_silence_bits;
|
|
|
|
(void) outer_loop(gfc, cod_info, l3_xmin, xrpow, ch, targ_bits[gr][ch]);
|
|
}
|
|
iteration_finish_one(gfc, gr, ch);
|
|
} /* ch */
|
|
} /* gr */
|
|
|
|
/* find a bitrate which can refill the resevoir to positive size.
|
|
*/
|
|
for (eov->bitrate_index = cfg->vbr_min_bitrate_index;
|
|
eov->bitrate_index <= cfg->vbr_max_bitrate_index; eov->bitrate_index++) {
|
|
if (ResvFrameBegin(gfc, &mean_bits) >= 0)
|
|
break;
|
|
}
|
|
assert(eov->bitrate_index <= cfg->vbr_max_bitrate_index);
|
|
|
|
ResvFrameEnd(gfc, mean_bits);
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
/************************************************************************
|
|
*
|
|
* CBR_iteration_loop()
|
|
*
|
|
* author/date??
|
|
*
|
|
* encodes one frame of MP3 data with constant bitrate
|
|
*
|
|
************************************************************************/
|
|
|
|
void
|
|
CBR_iteration_loop(lame_internal_flags * gfc, const FLOAT pe[2][2],
|
|
const FLOAT ms_ener_ratio[2], const III_psy_ratio ratio[2][2])
|
|
{
|
|
SessionConfig_t const *const cfg = &gfc->cfg;
|
|
FLOAT l3_xmin[SFBMAX];
|
|
FLOAT xrpow[576];
|
|
int targ_bits[2];
|
|
int mean_bits, max_bits;
|
|
int gr, ch;
|
|
III_side_info_t *const l3_side = &gfc->l3_side;
|
|
gr_info *cod_info;
|
|
|
|
(void) ResvFrameBegin(gfc, &mean_bits);
|
|
|
|
/* quantize! */
|
|
for (gr = 0; gr < cfg->mode_gr; gr++) {
|
|
|
|
/* calculate needed bits
|
|
*/
|
|
max_bits = on_pe(gfc, pe, targ_bits, mean_bits, gr, gr);
|
|
|
|
if (gfc->ov_enc.mode_ext == MPG_MD_MS_LR) {
|
|
ms_convert(&gfc->l3_side, gr);
|
|
reduce_side(targ_bits, ms_ener_ratio[gr], mean_bits, max_bits);
|
|
}
|
|
|
|
for (ch = 0; ch < cfg->channels_out; ch++) {
|
|
FLOAT adjust, masking_lower_db;
|
|
cod_info = &l3_side->tt[gr][ch];
|
|
|
|
if (cod_info->block_type != SHORT_TYPE) { /* NORM, START or STOP type */
|
|
/* adjust = 1.28/(1+exp(3.5-pe[gr][ch]/300.))-0.05; */
|
|
adjust = 0;
|
|
masking_lower_db = gfc->sv_qnt.mask_adjust - adjust;
|
|
}
|
|
else {
|
|
/* adjust = 2.56/(1+exp(3.5-pe[gr][ch]/300.))-0.14; */
|
|
adjust = 0;
|
|
masking_lower_db = gfc->sv_qnt.mask_adjust_short - adjust;
|
|
}
|
|
gfc->sv_qnt.masking_lower = pow(10.0, masking_lower_db * 0.1);
|
|
|
|
/* init_outer_loop sets up cod_info, scalefac and xrpow
|
|
*/
|
|
init_outer_loop(gfc, cod_info);
|
|
if (init_xrpow(gfc, cod_info, xrpow)) {
|
|
/* xr contains energy we will have to encode
|
|
* calculate the masking abilities
|
|
* find some good quantization in outer_loop
|
|
*/
|
|
(void) calc_xmin(gfc, &ratio[gr][ch], cod_info, l3_xmin);
|
|
(void) outer_loop(gfc, cod_info, l3_xmin, xrpow, ch, targ_bits[ch]);
|
|
}
|
|
|
|
iteration_finish_one(gfc, gr, ch);
|
|
assert(cod_info->part2_3_length <= MAX_BITS_PER_CHANNEL);
|
|
assert(cod_info->part2_3_length <= targ_bits[ch]);
|
|
} /* for ch */
|
|
} /* for gr */
|
|
|
|
ResvFrameEnd(gfc, mean_bits);
|
|
}
|