xiph
/
vorbis
Mirror von https://git.xiph.org/vorbis.git


			
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864
							/********************************************************************
 *                                                                  *
 * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE.   *
 * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS     *
 * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE *
 * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING.       *
 *                                                                  *
 * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2001             *
 * by the XIPHOPHORUS Company http://www.xiph.org/                  *

 ********************************************************************

 function: psychoacoustics not including preecho
 last mod: $Id: psy.c,v 1.44.2.2 2001/03/28 04:50:55 segher Exp $

 ********************************************************************/

#include <stdlib.h>
#include <math.h>
#include <string.h>
#include "vorbis/codec.h"
#include "codec_internal.h"

#include "masking.h"
#include "psy.h"
#include "os.h"
#include "lpc.h"
#include "smallft.h"
#include "scales.h"
#include "misc.h"


//#define todB_t(x) todB(x)


#define todB_t(x) (dbtab[(*(int *)&(x) >> 20)&2047])

static float dbtab[2048];

static void initdbtab()
{
	int i, x;

	for (i = 0; i < 2048; i++) {
		*(int *)(dbtab + i) = (i << 20) | (1 << 19);
		dbtab[i] = todB(dbtab[i]);
//fprintf(stderr, "%4d: %08x %12.6f\n", i, (i << 20) | (1 << 19), dbtab[i]);
	}
}


#define NEGINF -9999.f

/* Why Bark scale for encoding but not masking computation? Because
   masking has a strong harmonic dependancy */

/* the beginnings of real psychoacoustic infrastructure.  This is
   still not tightly tuned */
void _vi_psy_free(vorbis_info_psy *i){
  if(i){
    memset(i,0,sizeof(vorbis_info_psy));
    _ogg_free(i);
  }
}

vorbis_info_psy *_vi_psy_copy(vorbis_info_psy *i){
  vorbis_info_psy *ret=_ogg_malloc(sizeof(vorbis_info_psy));
  memcpy(ret,i,sizeof(vorbis_info_psy));
  return(ret);
}

/* Set up decibel threshold slopes on a Bark frequency scale */
/* ATH is the only bit left on a Bark scale.  No reason to change it
   right now */
static void set_curve(float *ref,float *c,int n, float crate){
  int i,j=0;

  for(i=0;i<MAX_BARK-1;i++){
    int endpos=rint(fromBARK(i+1)*2*n/crate);
    float base=ref[i];
    if(j<endpos){
      float delta=(ref[i+1]-base)/(endpos-j);
      for(;j<endpos && j<n;j++){
	c[j]=base;
	base+=delta;
      }
    }
  }
}

static void min_curve(float *c,
		       float *c2){
  int i;  
  for(i=0;i<EHMER_MAX;i++)if(c2[i]<c[i])c[i]=c2[i];
}
static void max_curve(float *c,
		       float *c2){
  int i;  
  for(i=0;i<EHMER_MAX;i++)if(c2[i]>c[i])c[i]=c2[i];
}

static void attenuate_curve(float *c,float att){
  int i;
  for(i=0;i<EHMER_MAX;i++)
    c[i]+=att;
}

static void interp_curve(float *c,float *c1,float *c2,float del){
  int i;
  for(i=0;i<EHMER_MAX;i++)
    c[i]=c2[i]*del+c1[i]*(1.f-del);
}

static void setup_curve(float **c,
			int band,
			float *curveatt_dB){
  int i,j;
  float ath[EHMER_MAX];
  float tempc[P_LEVELS][EHMER_MAX];

  memcpy(c[0]+2,c[4]+2,sizeof(float)*EHMER_MAX);
  memcpy(c[2]+2,c[4]+2,sizeof(float)*EHMER_MAX);

  /* we add back in the ATH to avoid low level curves falling off to
     -infinity and unneccessarily cutting off high level curves in the
     curve limiting (last step).  But again, remember... a half-band's
     settings must be valid over the whole band, and it's better to
     mask too little than too much, so be pessimal. */

  for(i=0;i<EHMER_MAX;i++){
    float oc_min=band*.5+(i-EHMER_OFFSET)*.125;
    float oc_max=band*.5+(i-EHMER_OFFSET+1)*.125;
    float bark=toBARK(fromOC(oc_min));
    int ibark=floor(bark);
    float del=bark-ibark;
    float ath_min,ath_max;

    if(ibark<26)
      ath_min=ATH_Bark_dB[ibark]*(1.f-del)+ATH_Bark_dB[ibark+1]*del;
    else
      ath_min=ATH_Bark_dB[25];

    bark=toBARK(fromOC(oc_max));
    ibark=floor(bark);
    del=bark-ibark;

    if(ibark<26)
      ath_max=ATH_Bark_dB[ibark]*(1.f-del)+ATH_Bark_dB[ibark+1]*del;
    else
      ath_max=ATH_Bark_dB[25];

    ath[i]=min(ath_min,ath_max);
  }

  /* The c array is comes in as dB curves at 20 40 60 80 100 dB.
     interpolate intermediate dB curves */
  for(i=1;i<P_LEVELS;i+=2){
    interp_curve(c[i]+2,c[i-1]+2,c[i+1]+2,.5);
  }

  /* normalize curves so the driving amplitude is 0dB */
  /* make temp curves with the ATH overlayed */
  for(i=0;i<P_LEVELS;i++){
    attenuate_curve(c[i]+2,curveatt_dB[i]);
    memcpy(tempc[i],ath,EHMER_MAX*sizeof(float));
    attenuate_curve(tempc[i],-i*10.f);
    max_curve(tempc[i],c[i]+2);
  }

  /* Now limit the louder curves.

     the idea is this: We don't know what the playback attenuation
     will be; 0dB SL moves every time the user twiddles the volume
     knob. So that means we have to use a single 'most pessimal' curve
     for all masking amplitudes, right?  Wrong.  The *loudest* sound
     can be in (we assume) a range of ...+100dB] SL.  However, sounds
     20dB down will be in a range ...+80], 40dB down is from ...+60],
     etc... */

  for(j=1;j<P_LEVELS;j++){
    min_curve(tempc[j],tempc[j-1]);
    min_curve(c[j]+2,tempc[j]);
  }

  /* add fenceposts */
  for(j=0;j<P_LEVELS;j++){

    for(i=0;i<EHMER_MAX;i++)
      if(c[j][i+2]>-200.f)break;  
    c[j][0]=i;

    for(i=EHMER_MAX-1;i>=0;i--)
      if(c[j][i+2]>-200.f)
	break;
    c[j][1]=i;

  }
}

void _vp_psy_init(vorbis_look_psy *p,vorbis_info_psy *vi,int n,long rate){
  long i,j;
  long maxoc;
  memset(p,0,sizeof(vorbis_look_psy));


initdbtab();

  p->eighth_octave_lines=vi->eighth_octave_lines;
  p->shiftoc=rint(log(vi->eighth_octave_lines*8)/log(2))-1;

  p->firstoc=toOC(.25f*rate/n)*(1<<(p->shiftoc+1))-vi->eighth_octave_lines;
  maxoc=toOC((n*.5f-.25f)*rate/n)*(1<<(p->shiftoc+1))+.5f;
  p->total_octave_lines=maxoc-p->firstoc+1;

  p->ath=_ogg_malloc(n*sizeof(float));
  p->octave=_ogg_malloc(n*sizeof(long));
  p->bark=_ogg_malloc(n*sizeof(float));
  p->vi=vi;
  p->n=n;

  /* set up the lookups for a given blocksize and sample rate */
  /* Vorbis max sample rate is currently limited by 26 Bark (54kHz) */
  set_curve(ATH_Bark_dB, p->ath,n,rate);
  for(i=0;i<n;i++)
    p->bark[i]=toBARK(rate/(2*n)*i); 

  for(i=0;i<n;i++)
    p->octave[i]=toOC((i*.5f+.25f)*rate/n)*(1<<(p->shiftoc+1))+.5f;

  p->tonecurves=_ogg_malloc(P_BANDS*sizeof(float **));
  p->noisemedian=_ogg_malloc(n*sizeof(float));
  p->inoisemedian=_ogg_malloc(n*sizeof(int));
  p->barknoisewindowlo=_ogg_malloc(n*sizeof(int));
  p->barknoisewindowhi=_ogg_malloc(n*sizeof(int));
  p->noiseoffset=_ogg_malloc(n*sizeof(float));
  p->peakatt=_ogg_malloc(P_BANDS*sizeof(float *));
  for(i=0;i<P_BANDS;i++){
    p->tonecurves[i]=_ogg_malloc(P_LEVELS*sizeof(float *));
    p->peakatt[i]=_ogg_malloc(P_LEVELS*sizeof(float));
  }

  for(i=0;i<P_BANDS;i++)
    for(j=0;j<P_LEVELS;j++){
      p->tonecurves[i][j]=_ogg_malloc((EHMER_MAX+2)*sizeof(float));
    }

  /* OK, yeah, this was a silly way to do it */
  memcpy(p->tonecurves[0][4]+2,tone_125_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[0][6]+2,tone_125_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[0][8]+2,tone_125_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[0][10]+2,tone_125_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[2][4]+2,tone_125_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[2][6]+2,tone_125_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[2][8]+2,tone_125_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[2][10]+2,tone_125_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[4][4]+2,tone_250_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[4][6]+2,tone_250_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[4][8]+2,tone_250_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[4][10]+2,tone_250_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[6][4]+2,tone_500_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[6][6]+2,tone_500_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[6][8]+2,tone_500_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[6][10]+2,tone_500_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[8][4]+2,tone_1000_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[8][6]+2,tone_1000_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[8][8]+2,tone_1000_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[8][10]+2,tone_1000_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[10][4]+2,tone_2000_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[10][6]+2,tone_2000_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[10][8]+2,tone_2000_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[10][10]+2,tone_2000_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[12][4]+2,tone_4000_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[12][6]+2,tone_4000_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[12][8]+2,tone_4000_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[12][10]+2,tone_4000_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[14][4]+2,tone_8000_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[14][6]+2,tone_8000_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[14][8]+2,tone_8000_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[14][10]+2,tone_8000_100dB_SL,sizeof(float)*EHMER_MAX);

  memcpy(p->tonecurves[16][4]+2,tone_8000_40dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[16][6]+2,tone_8000_60dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[16][8]+2,tone_8000_80dB_SL,sizeof(float)*EHMER_MAX);
  memcpy(p->tonecurves[16][10]+2,tone_8000_100dB_SL,sizeof(float)*EHMER_MAX);

  /* interpolate curves between */
  for(i=1;i<P_BANDS;i+=2)
    for(j=4;j<P_LEVELS;j+=2){
      memcpy(p->tonecurves[i][j]+2,p->tonecurves[i-1][j]+2,EHMER_MAX*sizeof(float));
      /*interp_curve(p->tonecurves[i][j],
		   p->tonecurves[i-1][j],
		   p->tonecurves[i+1][j],.5);*/
      min_curve(p->tonecurves[i][j]+2,p->tonecurves[i+1][j]+2);
    }

  /* set up the final curves */
  for(i=0;i<P_BANDS;i++)
    setup_curve(p->tonecurves[i],i,vi->toneatt[i]);

  /* set up attenuation levels */
  for(i=0;i<P_BANDS;i++)
    for(j=0;j<P_LEVELS;j++){
      p->peakatt[i][j]=p->vi->peakatt[i][j];
    }

  /* set up rolling noise median */
  for(i=0;i<n;i++){
    float halfoc=toOC((i+.5)*rate/(2.*n))*2.+2.;
    int inthalfoc;
    float del;
    
    if(halfoc<0)halfoc=0;
    if(halfoc>=P_BANDS-1)halfoc=P_BANDS-1;
    inthalfoc=(int)halfoc;
    del=halfoc-inthalfoc;

    p->noisemedian[i]=
      p->vi->noisemedian[inthalfoc*2]*(1.-del) + 
      p->vi->noisemedian[inthalfoc*2+2]*del;
    p->inoisemedian[i]=(int)(65536.0f*p->noisemedian[i]);
    p->noiseoffset[i]=
      p->vi->noisemedian[inthalfoc*2+1]*(1.-del) + 
      p->vi->noisemedian[inthalfoc*2+3]*del;
  }

  {
    long i=0,lo=0,hi=0;
    float bi;
    for(i=0;i<n;i++){
      /* find new lo/hi */
      bi=p->bark[i]+p->vi->noisewindowhi;
      for(;hi<n && (hi<i+p->vi->noisewindowhimin || p->bark[hi]<=bi);hi++) ;
      p->barknoisewindowhi[i] = hi;
      bi=p->bark[i]-p->vi->noisewindowlo;
      for(;lo<i && lo+p->vi->noisewindowlomin<i && p->bark[lo]<=bi;lo++) ;
      p->barknoisewindowlo[i] = lo;
    }
  }

  /*_analysis_output("mediancurve",0,p->noisemedian,n,0,0);*/
}

void _vp_psy_clear(vorbis_look_psy *p){
  int i,j;
  if(p){
    if(p->ath)_ogg_free(p->ath);
    if(p->octave)_ogg_free(p->octave);
    if(p->bark)_ogg_free(p->bark);
    if(p->tonecurves){
      for(i=0;i<P_BANDS;i++){
	for(j=0;j<P_LEVELS;j++){
	  _ogg_free(p->tonecurves[i][j]);
	}
	_ogg_free(p->tonecurves[i]);
	_ogg_free(p->peakatt[i]);
      }
      _ogg_free(p->tonecurves);
      _ogg_free(p->noisemedian);
      _ogg_free(p->inoisemedian);
      _ogg_free(p->barknoisewindowlo);
      _ogg_free(p->barknoisewindowhi);
      _ogg_free(p->noiseoffset);
      _ogg_free(p->peakatt);
    }
    memset(p,0,sizeof(vorbis_look_psy));
  }
}

/* octave/(8*eighth_octave_lines) x scale and dB y scale */
static void seed_curve(float *seed,
		      float **curves,
		      float amp,
		      int oc,int n,int linesper,float dBoffset){
  int i;
  long seedptr;
  float *posts,*curve;
  int a,b;

  int choice=(int)((amp+dBoffset)*.1f);
  choice=max(choice,0);
  choice=min(choice,P_LEVELS-1);
  posts=curves[choice];
  a=posts[0];
  b=posts[1];
  curve=posts+2;
  seedptr=oc+(a-16)*linesper-(linesper>>1);

  for(i=a;i<b;i++){
    if(seedptr>0){
      float lin=amp+curve[i];
      if(seed[seedptr]<lin)seed[seedptr]=lin;
    }
    seedptr+=linesper;
    if(seedptr>=n)break;
  }
}

static void seed_peak(float *seed,
		      float *att,
		      float amp,
		      int oc,
		      int linesper,
		      float dBoffset){
  long seedptr;

  int choice=(int)((amp+dBoffset)*.1f);
  choice=max(choice,0);
  choice=min(choice,P_LEVELS-1);
  seedptr=oc-(linesper>>1);

  amp+=att[choice];
  if(seed[seedptr]<amp)seed[seedptr]=amp;

}

static void seed_loop(vorbis_look_psy *p,
		      float ***curves,
		      float **att,
		      float *f, 
		      float *flr,
		      float *minseed,
		      float *maxseed,
		      float specmax){
  vorbis_info_psy *vi=p->vi;
  long n=p->n,i;
  float dBoffset=vi->max_curve_dB-specmax;

  /* prime the working vector with peak values */

  for(i=0;i<n;i++){
      float max=f[i];
      long oc=p->octave[i];
      while(i+1<n && p->octave[i+1]==oc){
	i++;
	if(f[i]>max)max=f[i];
      }

      if(max>flr[i]){
	oc=oc>>p->shiftoc;
	if(oc>=P_BANDS)oc=P_BANDS-1;
	if(oc<0)oc=0;
	if(vi->tonemaskp)
	  seed_curve(minseed,
		     curves[oc],
		     max,
		     p->octave[i]-p->firstoc,
		     p->total_octave_lines,
		     p->eighth_octave_lines,
		     dBoffset);
	if(vi->peakattp)
	  seed_peak(maxseed,
		    att[oc],
		    max,
		    p->octave[i]-p->firstoc,
		    p->eighth_octave_lines,
		    dBoffset);
      }
  }
}

static void bound_loop(vorbis_look_psy *p,
		       float *f, 
		       float *seeds,
		       float *flr,
		       float att){
  long n=p->n,i;

  long off=(p->eighth_octave_lines>>1)+p->firstoc;
  long *ocp=p->octave;

  for(i=0;i<n;i++){
    long oc=ocp[i]-off;
    float v=f[i]+att;
    if(seeds[oc]<v)seeds[oc]=v;
  }
}

static void seed_chase(float *seeds, int linesper, long n){
  long  *posstack=alloca(n*sizeof(long));
  float *ampstack=alloca(n*sizeof(float));
  long   stack=0;
  long   pos=0;
  long   i;

  for(i=0;i<n;i++){
    if(stack<2){
      posstack[stack]=i;
      ampstack[stack++]=seeds[i];
    }else{
      while(1){
	if(seeds[i]<ampstack[stack-1]){
	  posstack[stack]=i;
	  ampstack[stack++]=seeds[i];
	  break;
	}else{
	  if(i<posstack[stack-1]+linesper){
	    if(stack>1 && ampstack[stack-1]<=ampstack[stack-2] &&
	       i<posstack[stack-2]+linesper){
	      /* we completely overlap, making stack-1 irrelevant.  pop it */
	      stack--;
	      continue;
	    }
	  }
	  posstack[stack]=i;
	  ampstack[stack++]=seeds[i];
	  break;

	}
      }
    }
  }

  /* the stack now contains only the positions that are relevant. Scan
     'em straight through */

  for(i=0;i<stack;i++){
    long endpos;
    if(i<stack-1 && ampstack[i+1]>ampstack[i]){
      endpos=posstack[i+1];
    }else{
      endpos=posstack[i]+linesper+1; /* +1 is important, else bin 0 is
					discarded in short frames */
    }
    if(endpos>n)endpos=n;
    for(;pos<endpos;pos++)
      seeds[pos]=ampstack[i];
  }
  
  /* there.  Linear time.  I now remember this was on a problem set I
     had in Grad Skool... I didn't solve it at the time ;-) */

}

/* bleaugh, this is more complicated than it needs to be */
static void max_seeds(vorbis_look_psy *p,float *minseed,float *maxseed,
		      float *flr){
  long   n=p->total_octave_lines;
  int    linesper=p->eighth_octave_lines;
  long   linpos=0;
  long   pos;

  seed_chase(minseed,linesper,n); /* for masking */
  seed_chase(maxseed,linesper,n); /* for peak att */
 
  pos=p->octave[0]-p->firstoc-(linesper>>1);
  while(linpos+1<p->n){
    float min=minseed[pos];
    float max=maxseed[pos];
    long end=((p->octave[linpos]+p->octave[linpos+1])>>1)-p->firstoc;
    while(pos+1<=end){
      pos++;
      if((minseed[pos]>NEGINF && minseed[pos]<min) || min==NEGINF)
	min=minseed[pos];
      if(maxseed[pos]>max)max=maxseed[pos];
    }
    if(max<min)max=min;
    
    /* seed scale is log.  Floor is linear.  Map back to it */
    end=pos+p->firstoc;
    for(;linpos<p->n && p->octave[linpos]<=end;linpos++)
      if(flr[linpos]<max)flr[linpos]=max;
  }
  
  {
    float min=minseed[p->total_octave_lines-1];
    float max=maxseed[p->total_octave_lines-1];
    if(max<min)max=min;
    for(;linpos<p->n;linpos++)
      if(flr[linpos]<max)flr[linpos]=max;
  }
  
}

/* quarter-dB bins */
#define BIN(x)   ((int)((x)*negFour))
#define BINdB(x) ((x)*negQuarter)
#define BINCOUNT (200*4)
#define LASTBIN  (BINCOUNT-1)

static void old_bark_noise_median(long n,float *b,float *f,float *noise,
			      float lowidth,float hiwidth,
			      int lomin,int himin,
			      float *thresh,float *off){
  long i=0,lo=0,hi=0;
  float bi,threshi;
  long median=LASTBIN;
  float negFour = -4.0f;
  float negQuarter = -0.25f;

   /* these are really integral values, but we store them in floats to
      avoid excessive float/int conversions, which GCC and MSVC are
      farily poor at optimizing. */

  float radix[BINCOUNT];
  float countabove=0;
  float countbelow=0;

  memset(radix,0,sizeof(radix));

  for(i=0;i<n;i++){
    /* find new lo/hi */
    bi=b[i]+hiwidth;
    for(;hi<n && (hi<i+himin || b[hi]<=bi);hi++){
      int bin=BIN(f[hi]);
      if(bin>LASTBIN)bin=LASTBIN;
      if(bin<0)bin=0;
      radix[bin]++;
      if(bin<median)
	countabove++;
      else
	countbelow++;
    }
//fprintf(stderr, "%d: %d, ", i, hi);
    bi=b[i]-lowidth;
    for(;lo<i && lo+lomin<i && b[lo]<=bi;lo++){
      int bin=BIN(f[lo]);
      if(bin>LASTBIN)bin=LASTBIN;
      if(bin<0)bin=0;
      radix[bin]--;
      if(bin<median)
	countabove--;
      else
	countbelow--;
    }
//fprintf(stderr, "%d\n", lo);

    /* move the median if needed */
//    if(countabove+countbelow){
      threshi = thresh[i]*(countabove+countbelow);

      while(threshi>countbelow && median>0){
	median--;
	countabove-=radix[median];
	countbelow+=radix[median];
      }

      while(threshi<(countbelow-radix[median]) &&
	    median<LASTBIN){
	countabove+=radix[median];
	countbelow-=radix[median];
	median++;
      }
//    }
    noise[i]=BINdB(median)+off[i];
  }
//exit(1);
}

static void bark_noise_median(long n,float *b,float *f,float *noise,
			      float lowidth,float hiwidth,
			      int lomin,int himin,
			      float *thresh,int *ithresh,int *bhi, int *blo, float *off){
  long i=0,lo=0,hi=0;
//  float bi;
int threshi;
  long median=LASTBIN;
  float negFour = -4.0f;
  float negQuarter = -0.25f;

  int radix[BINCOUNT];
  int countabove=0;
  int countbelow=0;

//old_bark_noise_median(n,b,f,noise,lowidth,hiwidth,lomin,himin,thresh,off);return;
  memset(radix,0,sizeof(radix));

  for(i=0;i<n;i++){
    /* find new lo/hi */
//    bi=b[i]+hiwidth;
//    for(;hi<n && (hi<i+himin || b[hi]<=bi);hi++){
    for(;hi<bhi[i];hi++){
      int bin=BIN(f[hi]);
      if(bin>LASTBIN)bin=LASTBIN;
      if(bin<0)bin=0;
      radix[bin]++;
//countabove += (bin < median);
//countbelow += (bin >= median);
      if(bin<median)
	countabove++;
    else
	countbelow++;
    }
//fprintf(stderr, "%d: %d, ", i, hi);
//    bi=b[i]-lowidth;
//    for(;lo<i && lo+lomin<i && b[lo]<=bi;lo++){
    for(;lo<blo[i];lo++){
      int bin=BIN(f[lo]);
      if(bin>LASTBIN)bin=LASTBIN;
      if(bin<0)bin=0;
      radix[bin]--;
//countabove -= (bin < median);
//countbelow -= (bin >= median);
      if(bin<median)
	countabove--;
      else
	countbelow--;
    }
//fprintf(stderr, "%d\n", lo);

    /* move the median if needed */
//      threshi = thresh[i]*(countabove+countbelow);
//      threshi = (ithresh[i]*(countabove+countbelow)+32768)>>16;
      threshi = (ithresh[i]*(countabove+countbelow))>>16;
//!fprintf(stderr, "%f %f\n", (float)threshi, thresh[i]*(countabove+countbelow));
//if(n==1024)fprintf(stderr, "%f\n", thresh[i]);
      while(threshi>countbelow && median>0){
	median--;
	countabove-=radix[median];
	countbelow+=radix[median];
      }

      while(threshi<(countbelow-radix[median]) &&
	    median<LASTBIN){
	countabove+=radix[median];
	countbelow-=radix[median];
	median++;
      }
    noise[i]=BINdB(median)+off[i];
  }
//if(n==1024)exit(1);
//!exit(1);
}

float _vp_compute_mask(vorbis_look_psy *p,
		      float *fft, 
		      float *mdct, 
		      float *flr, 
		      float *decay,
		      float specmax){
  int i,n=p->n;
  float localmax=NEGINF;
  static int seq=0;

  float *minseed=alloca(sizeof(float)*p->total_octave_lines);
  float *maxseed=alloca(sizeof(float)*p->total_octave_lines);
  for(i=0;i<p->total_octave_lines;i++)minseed[i]=maxseed[i]=NEGINF;

  /* go to dB scale. Also find the highest peak so we know the limits */
  for(i=0;i<n;i++){
    fft[i]=todB_t(fft[i]);
    if(fft[i]>localmax)localmax=fft[i];
  }
  if(specmax<localmax)specmax=localmax;


  for(i=0;i<n;i++){
    mdct[i]=todB_t(mdct[i]);
  }

  _analysis_output("mdct",seq,mdct,n,0,0);
  _analysis_output("fft",seq,fft,n,0,0);

  /* noise masking */
  if(p->vi->noisemaskp){
    bark_noise_median(n,p->bark,mdct,flr,
		      p->vi->noisewindowlo,
		      p->vi->noisewindowhi,
		      p->vi->noisewindowlomin,
		      p->vi->noisewindowhimin,
		      p->noisemedian,
		      p->inoisemedian,
		      p->barknoisewindowhi,
		      p->barknoisewindowlo,
		      p->noiseoffset);
    /* suppress any noise curve > specmax+p->vi->noisemaxsupp */
    for(i=0;i<n;i++)
      if(flr[i]>specmax+p->vi->noisemaxsupp)
	flr[i]=specmax+p->vi->noisemaxsupp;
    _analysis_output("noise",seq,flr,n,0,0);
  }else{
    for(i=0;i<n;i++)flr[i]=NEGINF;
  }

  /* set the ATH (floating below localmax, not global max by a
     specified att) */
  if(p->vi->athp){
    float att=localmax+p->vi->ath_adjatt;
    if(att<p->vi->ath_maxatt)att=p->vi->ath_maxatt;

    for(i=0;i<n;i++){
      float av=p->ath[i]+att;
      if(av>flr[i])flr[i]=av;
    }
  }

  _analysis_output("ath",seq,flr,n,0,0);

  /* tone/peak masking */

  /* XXX apply decay to the fft here */

  seed_loop(p,p->tonecurves,p->peakatt,fft,flr,minseed,maxseed,specmax);
  bound_loop(p,mdct,maxseed,flr,p->vi->bound_att_dB);
  _analysis_output("minseed",seq,minseed,p->total_octave_lines,0,0);
  _analysis_output("maxseed",seq,maxseed,p->total_octave_lines,0,0);
  max_seeds(p,minseed,maxseed,flr);
  _analysis_output("final",seq,flr,n,0,0);

  /* doing this here is clean, but we need to find a faster way to do
     it than to just tack it on */

  for(i=0;i<n;i++)if(mdct[i]>=flr[i])break;
  if(i==n)for(i=0;i<n;i++)flr[i]=NEGINF;


  seq++;

  return(specmax);
}


/* this applies the floor and (optionally) tries to preserve noise
   energy in low resolution portions of the spectrum */
/* f and flr are *linear* scale, not dB */
void _vp_apply_floor(vorbis_look_psy *p,float *f, float *flr){
  float *work=alloca(p->n*sizeof(float));
  int j;

  /* subtract the floor */
  for(j=0;j<p->n;j++){
    if(flr[j]<=0)
      work[j]=0.f;
    else
      work[j]=f[j]/flr[j];
  }

  memcpy(f,work,p->n*sizeof(float));
}

float _vp_ampmax_decay(float amp,vorbis_dsp_state *vd){
  vorbis_info *vi=vd->vi;
  codec_setup_info *ci=vi->codec_setup;
  int n=ci->blocksizes[vd->W]/2;
  float secs=(float)n/vi->rate;

  amp+=secs*ci->ampmax_att_per_sec;
  if(amp<-9999)amp=-9999;
  return(amp);
}