xiph
/
vorbis
mirror of https://git.xiph.org/vorbis.git


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366
							/********************************************************************
 *                                                                  *
 * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE.   *
 * USE, DISTRIBUTION AND REPRODUCTION OF THIS SOURCE IS GOVERNED BY *
 * THE GNU LESSER/LIBRARY PUBLIC LICENSE, WHICH IS INCLUDED WITH    *
 * THIS SOURCE. PLEASE READ THESE TERMS BEFORE DISTRIBUTING.        *
 *                                                                  *
 * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2000             *
 * by Monty <monty@xiph.org> and the XIPHOPHORUS Company            *
 * http://www.xiph.org/                                             *
 *                                                                  *
 ********************************************************************

 function: normalized modified discrete cosine transform
           power of two length transform only [16 <= n ]
 last mod: $Id: mdct.c,v 1.17.2.5 2000/11/04 06:43:50 xiphmont Exp $

 Algorithm adapted from _The use of multirate filter banks for coding
 of high quality digital audio_, by T. Sporer, K. Brandenburg and
 B. Edler, collection of the European Signal Processing Conference
 (EUSIPCO), Amsterdam, June 1992, Vol.1, pp 211-214 

 Note that the below code won't make much sense without the paper;
 The presented algorithm was already fairly polished, and the code
 once followed it closely.  The current code both corrects several
 typos in the paper and goes beyond the presented optimizations 
 (steps 4 through 6 are, for example, entirely eliminated).

 This module DOES NOT INCLUDE code to generate the window function.
 Everybody has their own weird favorite including me... I happen to
 like the properties of y=sin(2PI*sin^2(x)), but others may vehemently
 disagree.

 ********************************************************************/

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <math.h>
#include "mdct.h"
#include "os.h"
#include "misc.h"

/* Build the lookup tables needed by mdct_forward()/mdct_backward() for a
   transform of length n (per the file header: power of two, 16 <= n).

   lookup: receives n, log2n and ownership of the two tables; release
           them with mdct_clear().
   n:      transform length.

   trig holds n+n/4 floats as three interleaved (even,odd) tables:
     A at [0,n/2):    ( cos(4i*PI/n),        -sin(4i*PI/n)       ), i<n/4
     B at [n/2,n):    ( cos((2i+1)*PI/(2n)),  sin((2i+1)*PI/(2n))), i<n/4
     C at [n,n+n/4):  ( cos((4i+2)*PI/n),    -sin((4i+2)*PI/n)   ), i<n/8
   bitrev holds n/4 ints as n/8 pairs ((~rev)&mask, rev), where rev is the
   index i with its bits reversed across log2n-1 bits.

   If either allocation fails, whatever was allocated is released and
   *lookup is zeroed (so lookup->trig and lookup->bitrev are NULL); the
   function returns without building tables. */

void mdct_init(mdct_lookup *lookup,int n){
  int   *bitrev=_ogg_malloc(sizeof(int)*(n/4));
  float *trig=_ogg_malloc(sizeof(float)*(n+n/4));
  float *AE,*AO,*BE,*BO,*CE,*CO;
  int i,j;
  int log2n;

  /* never write through a failed allocation; leave the lookup in the
     same all-zero state mdct_clear() produces */
  if(!bitrev || !trig){
    if(bitrev)free(bitrev);
    if(trig)free(trig);
    memset(lookup,0,sizeof(mdct_lookup));
    return;
  }

  /* even/odd interleaved views into the single trig allocation */
  AE=trig;
  AO=trig+1;
  BE=AE+n/2;
  BO=BE+1;
  CE=BE+n/2;
  CO=CE+1;

  log2n=lookup->log2n=rint(log(n)/log(2));
  lookup->n=n;
  lookup->trig=trig;
  lookup->bitrev=bitrev;

  /* trig lookups... */

  for(i=0;i<n/4;i++){
    AE[i*2]=cos((M_PI/n)*(4*i));
    AO[i*2]=-sin((M_PI/n)*(4*i));
    BE[i*2]=cos((M_PI/(2*n))*(2*i+1));
    BO[i*2]=sin((M_PI/(2*n))*(2*i+1));
  }
  for(i=0;i<n/8;i++){
    CE[i*2]=cos((M_PI/n)*(4*i+2));
    CO[i*2]=-sin((M_PI/n)*(4*i+2));
  }

  /* bitreverse lookup... */

  {
    int mask=(1<<(log2n-1))-1;
    int msb=1<<(log2n-2);
    for(i=0;i<n/8;i++){
      int acc=0;
      /* mirror the bits of i around the log2n-1 bit field */
      for(j=0;msb>>j;j++)
        if((msb>>j)&i)acc|=1<<j;
      bitrev[i*2]=((~acc)&mask);
      bitrev[i*2+1]=acc;
    }
  }
}

/* Release the tables owned by an mdct_lookup and zero the structure.
   A NULL lookup is accepted and ignored; table pointers that are
   already NULL are skipped. */
void mdct_clear(mdct_lookup *l){
  if(!l)return;

  if(l->trig!=NULL)
    free(l->trig);
  if(l->bitrev!=NULL)
    free(l->bitrev);

  /* wipe every field so the lookup holds no stale pointers */
  memset(l,0,sizeof(*l));
}

/* Shared transform core used by both mdct_forward() and mdct_backward().

   x:    buffer of n2 floats holding the callers' "step 1" output;
         overwritten.
   w:    second buffer of n2 floats; overwritten.
   n, n2, n4, n8: transform length and n>>1, n>>2, n>>3 as computed by
         the callers.
   init: lookup tables built by mdct_init() (trig, bitrev, log2n).

   Step 3 swaps the roles of x and w after every pass, so the returned
   pointer is one of the two buffers passed in (which one depends on the
   number of passes, log2n-3).  Callers must use the return value rather
   than assuming the result is in x.

   The do/while loops below execute at least once; the file header states
   the supported range as 16 <= n. */
static float *_mdct_kernel(float *x, float *w,
			    int n, int n2, int n4, int n8,
			    mdct_lookup *init){
  int i;
  /* step 2 */
  /* Pair x[k] (lower half) with x[k+n4] (upper half).  Sums go to the
     upper half of w; differences are multiplied by A-table pairs and go
     to the lower half.  A is read backwards from trig+n2 in strides of 4
     floats. */

  {
    float *xA=x+n4;
    float *xB=x;
    float *w2=w+n4;
    float *A=init->trig+n2;

    float x0,x1;
    i=0;
    do{
      x0=*xA - *xB;
      w2[i]=    *xA++ + *xB++;
      x1=       *xA - *xB;
      A-=4;
      w[i++]=   x0 * A[0] + x1 * A[1];
      w[i]=     x1 * A[0] - x0 * A[1];
      w2[i++]=  *xA++ + *xB++;
    }while(i<n4);
  }

  /* step 3 */
  /* log2n-3 passes; each pass reads w, writes x, then swaps the two
     pointers so the next pass reads what was just written. */

  {
    int r,s;
    for(i=0;i<init->log2n-3;i++){
      int k0=n>>(i+2);
      int k1=1<<(i+3);
      int wbase=n2-2;
      float *A=init->trig;
      float *temp;

      for(r=0;r<(k0>>2);r++){
        int w1=wbase;
	int w2=w1-(k0>>1);
	float AEv= A[0],wA;
	float AOv= A[1],wB;
        int unroll=i;
	wbase-=2;

	/* each butterfly pre-increments w1/w2 once, so step back by k0+1
	   to get a net stride of k0; k0 is restored after the loops */
	k0++;
        unroll--;
        if(unroll>0){
          /* four butterflies per iteration: (2<<unroll)>>1 iterations
             gives the same 2<<i butterflies as the plain loop below */
          s=2<<unroll;
          s>>=1;
          do{
            wB     =w[w1]   -w[w2];
            x[w1]  =w[w1]   +w[w2];
            wA     =w[++w1] -w[++w2];
            x[w1]  =w[w1]   +w[w2];
            x[w2]  =wA*AEv  - wB*AOv;
            x[w2-1]=wB*AEv  + wA*AOv;
            w1-=k0;
            w2-=k0;
            wB     =w[w1]   -w[w2];
            x[w1]  =w[w1]   +w[w2];
            wA     =w[++w1] -w[++w2];
            x[w1]  =w[w1]   +w[w2];
            x[w2]  =wA*AEv  - wB*AOv;
            x[w2-1]=wB*AEv  + wA*AOv;
            w1-=k0;
            w2-=k0;
            wB     =w[w1]   -w[w2];
            x[w1]  =w[w1]   +w[w2];
            wA     =w[++w1] -w[++w2];
            x[w1]  =w[w1]   +w[w2];
            x[w2]  =wA*AEv  - wB*AOv;
            x[w2-1]=wB*AEv  + wA*AOv;
            w1-=k0;
            w2-=k0;
            wB     =w[w1]   -w[w2];
            x[w1]  =w[w1]   +w[w2];
            wA     =w[++w1] -w[++w2];
            x[w1]  =w[w1]   +w[w2];
            x[w2]  =wA*AEv  - wB*AOv;
            x[w2-1]=wB*AEv  + wA*AOv;
            w1-=k0;
            w2-=k0;
          }while(--s);
        }else{
          /* passes 0 and 1: one butterfly per iteration */
          s=2<<i;
          do{
            wB     =w[w1]   -w[w2];
            x[w1]  =w[w1]   +w[w2];
            wA     =w[++w1] -w[++w2];
            x[w1]  =w[w1]   +w[w2];
            x[w2]  =wA*AEv  - wB*AOv;
            x[w2-1]=wB*AEv  + wA*AOv;
            w1-=k0;
            w2-=k0;
          }while(--s);
	}
	k0--;

	/* next twiddle pair for the next value of r */
	A+=k1;
      }

      /* ping-pong: this pass's output becomes the next pass's input */
      temp=w;
      w=x;
      x=temp;
    }
  }

  /* step 4, 5, 6, 7 */
  /* n8 iterations.  Each reads four values of w at indices taken from a
     bitrev pair, combines them with one C-table pair (trig+n onward) and
     writes four results into x: two from the front (x1) and two from the
     back (x2). */
  {
    float *C=init->trig+n;
    int *bit=init->bitrev;
    float *x1=x;
    float *x2=x+n2-1;
    i=n8-1;
    do{
      int t1=*bit++;
      int t2=*bit++;

      float wA=w[t1]-w[t2+1];
      float wB=w[t1-1]+w[t2];
      float wC=w[t1]+w[t2+1];
      float wD=w[t1-1]-w[t2];

      float wACE=wA* *C;
      float wBCE=wB* *C++;
      float wACO=wA* *C;
      float wBCO=wB* *C++;
      
      *x1++=( wC+wACO+wBCE)*.5;
      *x2--=(-wD+wBCO-wACE)*.5;
      *x1++=( wD+wBCO-wACE)*.5; 
      *x2--=( wC-wACO-wBCE)*.5;
    }while(i--);
  }
  /* x here is whichever buffer the last swap left as the output side */
  return(x);
}

/* Forward transform.

   init: lookup built by mdct_init(); supplies n and the trig tables.
   in:   input samples, read at indices derived from n (the highest index
         touched is n-1 for the power-of-two lengths this file targets).
   out:  receives n/2 coefficients, each scaled by 4/n.

   Two n/2-float scratch buffers are taken from the stack with alloca()
   for the duration of the call. */
void mdct_forward(mdct_lookup *init, float *in, float *out){
  int n=init->n;
  float *x=alloca(sizeof(float)*(n/2));
  float *w=alloca(sizeof(float)*(n/2));
  float *xx;
  int n2=n>>1;
  int n4=n>>2;
  int n8=n>>3;
  int i;

  /* rotate + step 1: input samples are combined pairwise, then each
     pair is rotated by an A-table entry read backwards from trig+n2 */
  {
    float *A=init->trig+n2;
    int down=n2+n4-4;   /* input cursor that walks toward index 0 */
    int up=down+5;      /* input cursor that walks toward the end */
    float sumA,sumB;

    /* segment 1: x[0 .. n8) */
    i=0;
    while(i<n8){
      A-=2;
      sumA= in[down+2] + in[up];
      sumB= in[down] + in[up+2];
      x[i]=   sumB*A[1] + sumA*A[0];
      x[i+1]= sumB*A[0] - sumA*A[1];
      down-=4;
      up+=4;
      i+=2;
    }

    /* segment 2: x[n8 .. n2-n8); the upward cursor restarts at 1 */
    up=1;
    while(i<n2-n8){
      A-=2;
      sumA= in[down+2] - in[up];
      sumB= in[down] - in[up+2];
      x[i]=   sumB*A[1] + sumA*A[0];
      x[i+1]= sumB*A[0] - sumA*A[1];
      down-=4;
      up+=4;
      i+=2;
    }

    /* segment 3: x[n2-n8 .. n2); the downward cursor restarts at n-4 */
    down=n-4;
    while(i<n2){
      A-=2;
      sumA= -in[down+2] - in[up];
      sumB= -in[down] - in[up+2];
      x[i]=   sumB*A[1] + sumA*A[0];
      x[i+1]= sumB*A[0] - sumA*A[1];
      down-=4;
      up+=4;
      i+=2;
    }
  }

  /* the kernel returns whichever scratch buffer ended up with the result */
  xx=_mdct_kernel(x,w,n,n2,n4,n8,init);

  /* step 8: rotate by the B table and scale; the first n4 outputs are
     written ascending from out[0], the rest descending from out[n2-1] */
  {
    float *B=init->trig+n2;
    float scale=4./n;
    int last=n2-1;

    for(i=0;i<n4;i++){
      float *p=xx+2*i;
      float *b=B+2*i;

      out[i]     =(p[0]*b[0]+p[1]*b[1])*scale;
      out[last-i]=(p[0]*b[1]-p[1]*b[0])*scale;
    }
  }
}

/* Inverse transform.

   init: lookup built by mdct_init(); supplies n and the trig tables.
   in:   n/2 input coefficients (odd indices are consumed ascending,
         then even indices descending).
   out:  receives n values: each rotated result is written twice,
         mirrored about index n/4 (with opposite signs) and about index
         n/4+n/2 (with equal signs).

   Two n/2-float scratch buffers are taken from the stack with alloca()
   for the duration of the call. */
void mdct_backward(mdct_lookup *init, float *in, float *out){
  int n=init->n;
  float *x=alloca(sizeof(float)*(n/2));
  float *w=alloca(sizeof(float)*(n/2));
  float *xx;
  int n2=n>>1;
  int n4=n>>2;
  int n8=n>>3;
  int i;

  /* rotate + step 1 */
  {
    float *A=init->trig+n2;
    int src;      /* index into in */
    int dst=0;    /* next free slot in x */

    /* first n8 pairs: odd input indices, ascending from 1 */
    src=1;
    for(i=0;i<n8;i++){
      A-=2;
      x[dst]  =-in[src+2]*A[1] - in[src]*A[0];
      x[dst+1]= in[src]*A[1] - in[src+2]*A[0];
      dst+=2;
      src+=4;
    }

    /* next n8 pairs: even input indices, descending from n2-4 */
    src=n2-4;
    for(i=0;i<n8;i++){
      A-=2;
      x[dst]  =in[src]*A[1] + in[src+2]*A[0];
      x[dst+1]=in[src]*A[0] - in[src+2]*A[1];
      dst+=2;
      src-=4;
    }
  }

  /* the kernel returns whichever scratch buffer ended up with the result */
  xx=_mdct_kernel(x,w,n,n2,n4,n8,init);

  /* step 8: rotate by the B table and unfold into the n outputs */
  {
    float *B=init->trig+n2;
    int mid1=n4;      /* mirror point of the first half of out */
    int mid2=n4+n2;   /* mirror point of the second half of out */

    for(i=0;i<n4;i++){
      float *p=xx+2*i;
      float *b=B+2*i;
      float temp1= (*p * b[1] - *(p+1) * b[0]);
      float temp2=-(*p * b[0] + *(p+1) * b[1]);

      out[mid1+i]  =-temp1;
      out[mid1-1-i]= temp1;
      out[mid2+i]  = temp2;
      out[mid2-1-i]= temp2;
    }
  }
}