Context Navigation

← Previous Change
Next Change →

psy.c

Timestamp:

10/07/06 02:49:28 (19 years ago)

Author:

r2d

Message:

fixed a LOT of bugs
fixed a bug that took me 2 days to find :)
remember to ALWAYS use -Wall with a C compiler (C++ is great !!!)
Files can be played, but the output is not bit-identical to that of the 1.15w encoder (the last digits of the floats differ) - must be fixed.

File:

: 1 edited

mppenc/branches/r2d/libmpcpsy/psy.c (modified) (32 diffs)

Legend:

: Unmodified
: Added
: Removed

mppenc/branches/r2d/libmpcpsy/psy.c

-                      r66
+                      r71
 #include "minimax.h"
+// psy_tab.c
 extern const float  iw        [PART_LONG];      // inverse partition-width for long
 extern const float  iw_short  [PART_SHORT];     // inverse partition-width for short
 …
 extern const int    wh        [PART_LONG];      // w_high for long
 extern const int    wh_short  [PART_SHORT];     // w_high for short
+extern float        MinVal   [PART_LONG];       // minimum quality that's adapted to the model, minval for long
+extern float  Loudness [PART_LONG];               // weighting factors for loudness calculation
+extern float  SPRD     [PART_LONG] [PART_LONG];   // tabulated spreading function
+extern float  O_MAX;
+extern float  O_MIN;
+extern float  FAC1;
+extern float  FAC2;                               // constants for offset calculation
+extern float  partLtq  [PART_LONG];               // threshold in quiet (partitions)
+extern float  invLtq   [PART_LONG];               // inverse threshold in quiet (partitions, long)
+extern float  fftLtq   [512];                     // threshold in quiet (FFT)
+// ans.c
+extern float         ANSspec_L [MAX_ANS_LINES];
+extern float         ANSspec_R [MAX_ANS_LINES];         // L/R-masking threshold for ANS
+extern float         ANSspec_M [MAX_ANS_LINES];
+extern float         ANSspec_S [MAX_ANS_LINES];         // M/S-masking threshold for ANS
+void   Init_Psychoakustiktabellen ( PsyModel* );
+int    CVD2048 ( PsyModel*, const float*, int* );
 // Antialiasing for calculation of the subband power
 …
 /* V A R I A B L E S */
+static float         a          [PART_LONG];
+static float         b          [PART_LONG];
+static float         c          [PART_LONG];
+static float         d          [PART_LONG];           // Integrations for tmpMask
 static float  Xsave_L    [3 * 512];
 static float  Xsave_R    [3 * 512];             // FFT-Amplitudes L/R
 static float  Ysave_L    [3 * 512];
 static float  Ysave_R    [3 * 512];             // FFT-Phases L/R
+static float         T_L        [PART_LONG];
+static float         T_R        [PART_LONG];           // time-constants for tmpMask
+static float         pre_erg_L[2][PART_SHORT];
+static float         pre_erg_R[2][PART_SHORT];          // Preecho-control short
+static float         PreThr_L   [PART_LONG];
+static float         PreThr_R   [PART_LONG];           // for Pre-Echo-control L/R
+static float         tmp_Mask_L [PART_LONG];
+static float         tmp_Mask_R [PART_LONG];           // for Post-Masking L/R
+static int           Vocal_L    [MAX_CVD_LINE + 4];
+static int           Vocal_R    [MAX_CVD_LINE + 4];    // FFT-Line belongs to harmonic?
 /* F U N C T I O N S */
 …
         memset ( Ysave_L,   0, sizeof Ysave_L );
         memset ( Ysave_R,   0, sizeof Ysave_R );
         memset ( m->a,         0, sizeof m->a       );
         memset ( m->b,         0, sizeof m->b       );
         memset ( m->c,         0, sizeof m->c       );
         memset ( m->d,         0, sizeof m->d       );
         memset ( m->T_L,       0, sizeof m->T_L     );
         memset ( m->T_R,       0, sizeof m->T_R     );
         memset ( m->Vocal_L,   0, sizeof m->Vocal_L );
         memset ( m->Vocal_R,   0, sizeof m->Vocal_R );
+        memset ( a,         0, sizeof a       );
+        memset ( b,         0, sizeof b       );
+        memset ( c,         0, sizeof c       );
+        memset ( d,         0, sizeof d       );
+        memset ( T_L,       0, sizeof T_L     );
+        memset ( T_R,       0, sizeof T_R     );
+        memset ( Vocal_L,   0, sizeof Vocal_L );
+        memset ( Vocal_R,   0, sizeof Vocal_R );
         m->SampleFreq = 0.;
 …
         m->KBD1 = 2.;
         m->KBD2 = -1.;
+        m->Ltq_offset = 0;
+        m->Ltq_max = 0;
+        m->EarModelFlag = 0;
     // generate FFT lookup-tables with largest FFT-size of 1024
         Init_FFT (m);
+        Init_Psychoakustiktabellen (m);
     // setting pre-echo variables to Ltq
         for ( i = 0; i < PART_LONG; i++ ) {
                 m->pre_erg_L  [0][i/3] = m->pre_erg_R  [0][i/3] =
                                 m->pre_erg_L  [1][i/3] = m->pre_erg_R  [1][i/3] =
                                 m->tmp_Mask_L [i]   = m->tmp_Mask_R [i]   =
                                 m->PreThr_L   [i]   = m->PreThr_R   [i]   = m->partLtq [i];
+                pre_erg_L  [0][i/3] = pre_erg_R  [0][i/3] =
+                                pre_erg_L  [1][i/3] = pre_erg_R  [1][i/3] =
+                                tmp_Mask_L [i]   = tmp_Mask_R [i]   =
+                                PreThr_L   [i]   = PreThr_R   [i]   = partLtq [i];
+        }
 …
 // SPRD describes the spreading function as calculated in psy_tab.c
 static void
 SpreadingSignal ( PsyModel* m, const float* erg, const float* werg, float* res,
+SpreadingSignal ( const float* erg, const float* werg, float* res,
                                   float* wres )
+{
 …
         start = maxi(k-5, 0);           // minimum affected partition
         stop  = mini(k+7, PART_LONG-1); // maximum affected partition
         sprd  = m->SPRD[k] + start;         // load vector
+        sprd  = SPRD[k] + start;         // load vector
         e     = *erg;
         ew    = *werg;
 …
 // output: masking threshold *erg after applying the tonality-offset
 static void
 ApplyTonalityOffset ( PsyModel* m, float* erg0, float* erg1, const float* werg0, const float* werg1 )
+ApplyTonalityOffset ( float* erg0, float* erg1, const float* werg0, const float* werg1 )
+{
     int    n;
 …
     for ( n = 0; n < PART_LONG; n++ ) {
         quot = *werg0++ / *erg0;
         if      (quot <= 0.05737540597f) Offset = m->O_MAX;
         else if (quot <  0.5871011603f ) Offset = m->FAC1 * POW (quot, m->FAC2);
         else                             Offset = m->O_MIN;
         *erg0++ *= iw[n] * minf(m->MinVal[n], Offset);
+        if      (quot <= 0.05737540597f) Offset = O_MAX;
+        else if (quot <  0.5871011603f ) Offset = FAC1 * POW (quot, FAC2);
+        else                             Offset = O_MIN;
+        *erg0++ *= iw[n] * minf(MinVal[n], Offset);
         quot = *werg1++ / *erg1;
         if      (quot <= 0.05737540597f) Offset = m->O_MAX;
         else if (quot <  0.5871011603f ) Offset = m->FAC1 * POW (quot, m->FAC2);
         else                             Offset = m->O_MIN;
                 *erg1++ *= iw[n] * minf(m->MinVal[n], Offset);
+        if      (quot <= 0.05737540597f) Offset = O_MAX;
+        else if (quot <  0.5871011603f ) Offset = FAC1 * POW (quot, FAC2);
+        else                             Offset = O_MIN;
+                *erg1++ *= iw[n] * minf(MinVal[n], Offset);
+    }
 …
+{
     static float  loud   = 0.f;
         float*        weight = m->Loudness;
+        float*        weight = Loudness;
     float         sum    = 0.f;
     int           n;
 …
 // output: tracked Integrations *a and *b, time constant *tau
 static void
 CalcTemporalThreshold ( PsyModel* m, float* a, float* b, float* tau, float* frqthr, float* tmpthr )
+CalcTemporalThreshold ( float* a, float* b, float* tau, float* frqthr, float* tmpthr )
+{
     int    n;
 …
     for ( n = 0; n < PART_LONG; n++ ) {
         // following calculations relative to threshold in quiet
         frqthr[n] *= m->invLtq[n];
                 tmpthr[n] *= m->invLtq[n];
+        frqthr[n] *= invLtq[n];
+                tmpthr[n] *= invLtq[n];
         // new post-masking 'tmp' via time constant tau, if old post-masking  > Ltq (=1)
 …
         // use post-masking of (Re-Normalization)
                 tmpthr[n] = maxf (frqthr[n], tmp) * m->partLtq[n];
+                tmpthr[n] = maxf (frqthr[n], tmp) * partLtq[n];
+    }
 …
 // inline, because it's called 4x
 static void
+ApplyLtq ( PsyModel* m,
+                   float*        thr0,
+ApplyLtq ( float*        thr0,
            float*        thr1,
            const float*  partThr0,
 …
 #else
             // Applies a much more gentle ATH rolloff + 6 dB more dynamic
             ltq   = sqrt (ms * m->fftLtq [k]);
+            ltq   = sqrt (ms * fftLtq [k]);
             tmp   = sqrt (partThr0 [n]) + ltq;
             *thr0 = tmp * tmp;
 …
     // 'ClearVocalDetection'-Process
     if ( m->CVD_used ) {
         memset ( m->Vocal_L, 0, sizeof m->Vocal_L );
         memset ( m->Vocal_R, 0, sizeof m->Vocal_R );
+        memset ( Vocal_L, 0, sizeof Vocal_L );
+        memset ( Vocal_R, 0, sizeof Vocal_R );
         // left channel
         PowSpec2048 ( &data->L[0], Xerg );
         isvoc_L = CVD2048 ( Xerg, m->Vocal_L );
+        isvoc_L = CVD2048 ( m, Xerg, Vocal_L );
         // right channel
         PowSpec2048 ( &data->R[0], Xerg );
         isvoc_R = CVD2048 ( Xerg, m->Vocal_R );
+        isvoc_R = CVD2048 ( m, Xerg, Vocal_R );
+    }
 …
     memmove ( Xsave_L+512, Xsave_L, 1024*sizeof(float) );
     memmove ( Ysave_L+512, Ysave_L, 1024*sizeof(float) );
     CalcUnpred ( m, MaxLine, erg0, phs0, isvoc_L ? m->Vocal_L : NULL, Xsave_L, Ysave_L, cw_L );
+    CalcUnpred ( m, MaxLine, erg0, phs0, isvoc_L ? Vocal_L : NULL, Xsave_L, Ysave_L, cw_L );
     // right
     memmove ( Xsave_R+512, Xsave_R, 1024*sizeof(float) );
     memmove ( Ysave_R+512, Ysave_R, 1024*sizeof(float) );
     CalcUnpred ( m, MaxLine, erg1, phs1, isvoc_R ? m->Vocal_R : NULL, Xsave_R, Ysave_R, cw_R );
+    CalcUnpred ( m, MaxLine, erg1, phs1, isvoc_R ? Vocal_R : NULL, Xsave_R, Ysave_R, cw_R );
     // calculation of the weighted acoustic pressures per each partition
 …
     memset ( clow_L    , 0, sizeof clow_L );
     memset ( sim_Mask_L, 0, sizeof sim_Mask_L );
     SpreadingSignal ( m, Ls_L, cLs_L, sim_Mask_L, clow_L );
+    SpreadingSignal ( Ls_L, cLs_L, sim_Mask_L, clow_L );
     // right
     memset ( clow_R    , 0, sizeof clow_R );
     memset ( sim_Mask_R, 0, sizeof sim_Mask_R );
     SpreadingSignal ( m, Ls_R, cLs_R, sim_Mask_R, clow_R );
+    SpreadingSignal ( Ls_R, cLs_R, sim_Mask_R, clow_R );
     // Offset depending on tonality
     ApplyTonalityOffset ( m, sim_Mask_L, sim_Mask_R, clow_L, clow_R );
+    ApplyTonalityOffset ( sim_Mask_L, sim_Mask_R, clow_L, clow_R );
     // handling of transient signals
 …
     PowSpec256 ( &data->L[432+SHORTFFT_OFFSET], F_256[3] );
     // calculate short Threshold
     CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_L, m->pre_erg_L, TransientL );
+    CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_L, pre_erg_L, TransientL );
     // calculate four short FFTs (right)
 …
     PowSpec256 ( &data->R[432+SHORTFFT_OFFSET], F_256[3] );
     // calculate short Threshold
     CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_R, m->pre_erg_R, TransientR );
+    CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_R, pre_erg_R, TransientR );
     // dynamic adjustment of the threshold in quiet to the loudness of the current sequence
 …
     // utilization of the temporal post-masking
     if ( m->tmpMask_used ) {
                 CalcTemporalThreshold (m, m->a, m->b, m->T_L, sim_Mask_L, m->tmp_Mask_L );
                 CalcTemporalThreshold (m, m->c, m->d, m->T_R, sim_Mask_R, m->tmp_Mask_R );
                 memcpy ( sim_Mask_L, m->tmp_Mask_L, sizeof sim_Mask_L );
                 memcpy ( sim_Mask_R, m->tmp_Mask_R, sizeof sim_Mask_R );
+                CalcTemporalThreshold ( a, b, T_L, sim_Mask_L, tmp_Mask_L );
+                CalcTemporalThreshold ( c, d, T_R, sim_Mask_R, tmp_Mask_R );
+                memcpy ( sim_Mask_L, tmp_Mask_L, sizeof sim_Mask_L );
+                memcpy ( sim_Mask_R, tmp_Mask_R, sizeof sim_Mask_R );
+    }
 …
     // Pre-Echo control
         PreechoControl ( PartThr_L, m->PreThr_L, sim_Mask_L, PartThr_R, m->PreThr_R, sim_Mask_R );
+        PreechoControl ( PartThr_L,PreThr_L, sim_Mask_L, PartThr_R, PreThr_R, sim_Mask_R );
     // utilization of the threshold in quiet
     ApplyLtq ( m, Thr_L, Thr_R, PartThr_L, PartThr_R, factorLTQ, 0 );
+    ApplyLtq ( Thr_L, Thr_R, PartThr_L, PartThr_R, factorLTQ, 0 );
     // Consideration of aliasing between the subbands (noise is smeared)
 …
         // calculate masking thresholds for M/S
         CalcMSThreshold ( m, Ls_L, Ls_R, Ls_M, Ls_S, PartThr_L, PartThr_R, PartThr_M, PartThr_S );
         ApplyLtq ( m, Thr_M, Thr_S, PartThr_M, PartThr_S, factorLTQ, 1 );
+        ApplyLtq ( Thr_M, Thr_S, PartThr_M, PartThr_S, factorLTQ, 1 );
         // Consideration of aliasing between the subbands (noise is smeared)
 …
         if ( m->NS_Order > 0 ) {       // providing the Noise Shaping thresholds
                 memcpy ( m->ANSspec_L, Thr_L, sizeof m->ANSspec_L );
                 memcpy ( m->ANSspec_R, Thr_R, sizeof m->ANSspec_R );
                 memcpy ( m->ANSspec_M, Thr_M, sizeof m->ANSspec_M );
                 memcpy ( m->ANSspec_S, Thr_S, sizeof m->ANSspec_S );
+                memcpy ( ANSspec_L, Thr_L, sizeof ANSspec_L );
+                memcpy ( ANSspec_R, Thr_R, sizeof ANSspec_R );
+                memcpy ( ANSspec_M, Thr_M, sizeof ANSspec_M );
+                memcpy ( ANSspec_S, Thr_S, sizeof ANSspec_S );
+    }
     /***************************************************************************************/
 …
     memmove ( Xsave_L+512, Xsave_L, 1024*sizeof(float) );
     memmove ( Ysave_L+512, Ysave_L, 1024*sizeof(float) );
         CalcUnpred ( m, MaxLine, erg0, phs0, isvoc_L ? m->Vocal_L : NULL, Xsave_L, Ysave_L, cw_L );
+        CalcUnpred ( m, MaxLine, erg0, phs0, isvoc_L ? Vocal_L : NULL, Xsave_L, Ysave_L, cw_L );
     // right
     memmove ( Xsave_R+512, Xsave_R, 1024*sizeof(float) );
     memmove ( Ysave_R+512, Ysave_R, 1024*sizeof(float) );
         CalcUnpred ( m, MaxLine, erg1, phs1, isvoc_R ? m->Vocal_R : NULL, Xsave_R, Ysave_R, cw_R );
+        CalcUnpred ( m, MaxLine, erg1, phs1, isvoc_R ? Vocal_R : NULL, Xsave_R, Ysave_R, cw_R );
     // calculation of the weighted acoustic pressure per each partition
 …
     memset ( clow_L    , 0, sizeof clow_L );
     memset ( sim_Mask_L, 0, sizeof sim_Mask_L );
     SpreadingSignal ( m, Ls_L, cLs_L, sim_Mask_L, clow_L );
+    SpreadingSignal ( Ls_L, cLs_L, sim_Mask_L, clow_L );
     // right
     memset ( clow_R    , 0, sizeof clow_R );
     memset ( sim_Mask_R, 0, sizeof sim_Mask_R );
     SpreadingSignal ( m, Ls_R, cLs_R, sim_Mask_R, clow_R );
+    SpreadingSignal ( Ls_R, cLs_R, sim_Mask_R, clow_R );
     // Offset depending on tonality
     ApplyTonalityOffset ( m, sim_Mask_L, sim_Mask_R, clow_L, clow_R );
+    ApplyTonalityOffset ( sim_Mask_L, sim_Mask_R, clow_L, clow_R );
     // Handling of transient signals
 …
     PowSpec256 ( &data->L[1008+SHORTFFT_OFFSET], F_256[3] );
     // calculate short Threshold
         CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_L, m->pre_erg_L, TransientL );
+        CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_L, pre_erg_L, TransientL );
     // calculate four short FFTs (right)
 …
     PowSpec256 ( &data->R[1008+SHORTFFT_OFFSET], F_256[3] );
     // calculate short Threshold
         CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_R, m->pre_erg_R, TransientR );
+        CalcShortThreshold ( m, F_256, m->ShortThr, shortThr_R, pre_erg_R, TransientR );
     // dynamic adjustment of threshold in quiet to loudness of the current sequence
 …
     // utilization of temporal post-masking
         if (m->tmpMask_used) {
                 CalcTemporalThreshold ( m, m->a, m->b, m->T_L, sim_Mask_L, m->tmp_Mask_L );
                 CalcTemporalThreshold ( m, m->c, m->d, m->T_R, sim_Mask_R, m->tmp_Mask_R );
                 memcpy ( sim_Mask_L, m->tmp_Mask_L, sizeof sim_Mask_L );
                 memcpy ( sim_Mask_R, m->tmp_Mask_R, sizeof sim_Mask_R );
+                CalcTemporalThreshold ( a, b, T_L, sim_Mask_L, tmp_Mask_L );
+                CalcTemporalThreshold ( c, d, T_R, sim_Mask_R, tmp_Mask_R );
+                memcpy ( sim_Mask_L, tmp_Mask_L, sizeof sim_Mask_L );
+                memcpy ( sim_Mask_R, tmp_Mask_R, sizeof sim_Mask_R );
+    }
 …
     // Pre-Echo control
         PreechoControl ( PartThr_L, m->PreThr_L, sim_Mask_L, PartThr_R, m->PreThr_R, sim_Mask_R );
+        PreechoControl ( PartThr_L, PreThr_L, sim_Mask_L, PartThr_R, PreThr_R, sim_Mask_R );
     // utilization of threshold in quiet
     ApplyLtq ( m, Thr_L, Thr_R, PartThr_L, PartThr_R, factorLTQ, 0 );
+    ApplyLtq ( Thr_L, Thr_R, PartThr_L, PartThr_R, factorLTQ, 0 );
     // Consideration of aliasing between the subbands (noise is smeared)
 …
         // calculate masking thresholds for M/S
         CalcMSThreshold ( m, Ls_L, Ls_R, Ls_M, Ls_S, PartThr_L, PartThr_R, PartThr_M, PartThr_S );
         ApplyLtq ( m, Thr_M, Thr_S, PartThr_M, PartThr_S, factorLTQ, 1 );
+        ApplyLtq ( Thr_M, Thr_S, PartThr_M, PartThr_S, factorLTQ, 1 );
         // Consideration of aliasing between the subbands (noise is smeared)
 …
         if ( m->NS_Order > 0 ) {
         for ( n = 0; n < MAX_ANS_LINES; n++ ) {                 // providing Noise Shaping thresholds
                         m->ANSspec_L [n] = minf ( m->ANSspec_L [n], Thr_L [n] );
                         m->ANSspec_R [n] = minf ( m->ANSspec_R [n], Thr_R [n] );
                         m->ANSspec_M [n] = minf ( m->ANSspec_M [n], Thr_M [n] );
                         m->ANSspec_S [n] = minf ( m->ANSspec_S [n], Thr_S [n] );
+                        ANSspec_L [n] = minf ( ANSspec_L [n], Thr_L [n] );
+                        ANSspec_R [n] = minf ( ANSspec_R [n], Thr_R [n] );
+                        ANSspec_M [n] = minf ( ANSspec_M [n], Thr_M [n] );
+                        ANSspec_S [n] = minf ( ANSspec_S [n], Thr_S [n] );
+        }
+    }

Note: See TracChangeset for help on using the changeset viewer.

Context Navigation

Changeset 71 for mppenc/branches/r2d/libmpcpsy/psy.c

Legend:

mppenc/branches/r2d/libmpcpsy/psy.c

Download in other formats: