/********************************************************************
 *                                                                  *
 * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE.   *
 * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS     *
 * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE *
 * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING.       *
 *                                                                  *
 * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2007             *
 * by the Xiph.Org Foundation http://www.xiph.org/                  *
 *                                                                  *
 ********************************************************************

 function: simple utility that runs audio through the psychoacoustics
           without encoding
 last mod: $Id: psytune.c 16037 2009-05-26 21:10:58Z xiphmont $

 ********************************************************************/
     18 
/* NB: this is dead code, retained purely for doc and reference value;
       don't try to compile it. */
     21 
#include <limits.h>
#include <math.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>

#include "vorbis/codec.h"
#include "codec_internal.h"
#include "os.h"
#include "misc.h"
#include "psy.h"
#include "mdct.h"
#include "smallft.h"
#include "window.h"
#include "scales.h"
#include "lpc.h"
#include "lsp.h"
#include "masking.h"
#include "registry.h"
     40 
     41 static vorbis_info_psy_global _psy_set0G={
     42   0,   /* decaydBpms */
     43   8,   /* lines per eighth octave */
     44 
     45   /* thresh sample period, preecho clamp trigger threshhold, range, minenergy */
     46   256, {26.f,26.f,26.f,30.f}, {-90.f,-90.f,-90.f,-90.f}, -90.f,
     47   -6.f,
     48 
     49   0,
     50 
     51   0.,
     52   0.,
     53 };
     54 
     55 static vp_part _vp_part0[]={
     56   {    1,9e10f, 9e10f,       1.f,9999.f},
     57   { 9999,  .75f, 9e10f,       .5f,9999.f},
     58 /*{ 9999, 1.5f, 9e10f,       .5f,9999.f},*/
     59   {   18,9e10f, 9e10f,       .5f,  30.f},
     60   { 9999,9e10f, 9e10f,       .5f,  30.f}
     61 };
     62 
     63 static vp_couple _vp_couple0[]={
     64   {    1,  {9e10f,9e10f,0}, {   0.f,   0.f,0}, {   0.f, 0.f,0}, {0.f,0.f,0}},
     65   {   18,  {9e10f,9e10f,0}, {   0.f,   0.f,0}, {   0.f, 0.f,0}, {0.f,0.f,0}},
     66   { 9999,  {9e10f,9e10f,0}, {   0.f, 9e10f,0}, {   0.f,22.f,1}, {0.f,0.f,0}}
     67 };
     68 
     69 static vorbis_info_psy _psy_set0={
     70   ATH_Bark_dB_lineaggressive,
     71 
     72   -100.f,
     73   -140.f,
     74   6.f, /* floor master att */
     75 
     76   /*     0  1  2   3   4   5   6   7   8   9  10  11  12  13  14  15   16   */
     77   /* x: 63 88 125 175 250 350 500 700 1k 1.4k 2k 2.8k 4k 5.6k 8k 11.5k 16k Hz */
     78   /* y: 0 10 20 30 40 50 60 70 80 90 100 dB */
     79    1,  /* tonemaskp */
     80   0.f, /* tone master att */
     81   /*  0   10   20   30   40   50   60   70   80   90   100 */
     82   {
     83    {-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f}, /*63*/
     84    {-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f}, /*88*/
     85    {-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f}, /*125*/
     86 
     87    {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*175*/
     88    {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*250*/
     89    {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*350*/
     90    {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*500*/
     91    {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*700*/
     92    {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*1000*/
     93    {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*1400*/
     94    {-40.f,-40.f,-40.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*2000*/
     95    {-40.f,-40.f,-40.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*2800*/
     96    {-40.f,-40.f,-40.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*4000*/
     97 
     98    {-30.f,-35.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*5600*/
     99 
    100    {-30.f,-30.f,-33.f,-35.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*8000*/
    101    {-30.f,-30.f,-33.f,-35.f,-40.f,-45.f,-50.f,-60.f,-70.f,-85.f,-100.f}, /*11500*/
    102    {-24.f,-24.f,-26.f,-32.f,-32.f,-42.f,-50.f,-60.f,-70.f,-85.f,-100.f}, /*16000*/
    103 
    104   },
    105 
    106   1,/* peakattp */
    107   {{-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*63*/
    108    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*88*/
    109    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*125*/
    110    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*175*/
    111    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*250*/
    112    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*350*/
    113    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*500*/
    114    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*700*/
    115    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*1000*/
    116    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*1400*/
    117    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*2000*/
    118    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*2800*/
    119    {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*4000*/
    120    {-10.f,-12.f,-14.f,-16.f,-16.f,-20.f,-24.f,-30.f,-32.f,-40.f,-40.f},/*5600*/
    121    {-10.f,-12.f,-14.f,-16.f,-16.f,-20.f,-24.f,-30.f,-32.f,-40.f,-40.f},/*8000*/
    122    {-10.f,-10.f,-10.f,-12.f,-14.f,-18.f,-22.f,-28.f,-32.f,-40.f,-40.f},/*11500*/
    123    {-10.f,-10.f,-10.f,-12.f,-14.f,-18.f,-22.f,-28.f,-32.f,-40.f,-40.f},/*16000*/
    124   },
    125 
    126   1,/*noisemaskp */
    127   -10.f,  /* suppress any noise curve over maxspec+n */
    128   .5f,   /* low window */
    129   .5f,   /* high window */
    130   10,
    131   10,
    132   25,
    133   {.000f, 0.f, /*63*/
    134    .000f, 0.f, /*88*/
    135    .000f, 0.f, /*125*/
    136    .000f, 0.f, /*175*/
    137    .000f, 0.f, /*250*/
    138    .000f, 0.f, /*350*/
    139    .000f, 0.f, /*500*/
    140    .000f, 0.f, /*700*/
    141    .000f, 0.f, /*1000*/
    142    .300f, 0.f, /*1400*/
    143    .300f, 0.f, /*2000*/
    144    .300f, 0.f, /*2800*/
    145    .500f, 0.f, /*4000*/
    146    .700f, 0.f, /*5600*/
    147    .850f, 0.f, /*8000*/
    148    .900f, 0.f, /*11500*/
    149    .900f, 1.f, /*16000*/
    150   },
    151 
    152   95.f,  /* even decade + 5 is important; saves an rint() later in a
    153             tight loop) */
    154   -44.,
    155 
    156   32,
    157   _vp_part0,_vp_couple0
    158 };
    159 
    160 static vorbis_info_floor1 _floor_set0={1,
    161                                         {0},
    162 
    163                                         {32},
    164                                         {0},
    165                                         {0},
    166                                         {{-1}},
    167 
    168                                         2,
    169                                         {0,1024,
    170 
    171                                          88,31,243,
    172 
    173                                          14,54,143,460,
    174 
    175                                          6,3,10, 22,18,26, 41,36,47,
    176                                          69,61,78, 112,99,126, 185,162,211,
    177                                          329,282,387, 672,553,825
    178                                          },
    179 
    180                                         60,30,400,
    181                                         20,8,1,18.,
    182                                         20,600,
    183                                         960};
    184 
    185 
    186 static vorbis_info_mapping0 mapping_info={1,{0,1},{0},{0},{0},0, 1, {0},{1}};
    187 static codec_setup_info codec_setup0={ {0,0},
    188                                        1,1,1,1,1,0,1,
    189                                        {NULL},
    190                                        {0},{&mapping_info},
    191                                        {0},{NULL},
    192                                        {1},{&_floor_set0},
    193                                        {2},{NULL},
    194                                        {NULL},
    195                                        {&_psy_set0},
    196                                        &_psy_set0G};
    197 
    198 static int noisy=0;
    199 void analysis(char *base,int i,float *v,int n,int bark,int dB){
    200   if(noisy){
    201     int j;
    202     FILE *of;
    203     char buffer[80];
    204     sprintf(buffer,"%s_%d.m",base,i);
    205     of=fopen(buffer,"w");
    206 
    207     for(j=0;j<n;j++){
    208       if(dB && v[j]==0)
    209           fprintf(of,"\n\n");
    210       else{
    211         if(bark)
    212           fprintf(of,"%g ",toBARK(22050.f*j/n));
    213         else
    214           fprintf(of,"%g ",(float)j);
    215 
    216         if(dB){
    217           fprintf(of,"%g\n",todB(v+j));
    218         }else{
    219           fprintf(of,"%g\n",v[j]);
    220         }
    221       }
    222     }
    223     fclose(of);
    224   }
    225 }
    226 
    227 long frameno=0;
    228 
    229 /****************************************************************/
    230 
    231 int main(int argc,char *argv[]){
    232   int eos=0;
    233   float nonz=0.f;
    234   float acc=0.f;
    235   float tot=0.f;
    236   float ampmax=-9999,newmax;
    237   float local_ampmax[2];
    238 
    239   int framesize=2048;
    240   float ampmax_att_per_sec=-6.;
    241 
    242   float *pcm[2],*out[2],*window,*flr[2],*mask[2],*work[2];
    243   signed char *buffer,*buffer2;
    244   mdct_lookup m_look;
    245   drft_lookup f_look;
    246   vorbis_look_psy p_look;
    247   vorbis_look_psy_global *pg_look;
    248   vorbis_look_floor *floor_look;
    249   vorbis_info vi;
    250   long i,j,k;
    251 
    252   int ath=0;
    253   int decayp=0;
    254 
    255   argv++;
    256   while(*argv){
    257     if(*argv[0]=='-'){
    258       /* option */
    259       if(argv[0][1]=='v'){
    260         noisy=0;
    261       }
    262     }else
    263       if(*argv[0]=='+'){
    264         /* option */
    265         if(argv[0][1]=='v'){
    266           noisy=1;
    267         }
    268       }else
    269         framesize=atoi(argv[0]);
    270     argv++;
    271   }
    272 
    273   vi.channels=2;
    274   vi.codec_setup=&codec_setup0;
    275 
    276   pcm[0]=_ogg_malloc(framesize*sizeof(float));
    277   pcm[1]=_ogg_malloc(framesize*sizeof(float));
    278   out[0]=_ogg_calloc(framesize/2,sizeof(float));
    279   out[1]=_ogg_calloc(framesize/2,sizeof(float));
    280   work[0]=_ogg_calloc(framesize,sizeof(float));
    281   work[1]=_ogg_calloc(framesize,sizeof(float));
    282   flr[0]=_ogg_calloc(framesize/2,sizeof(float));
    283   flr[1]=_ogg_calloc(framesize/2,sizeof(float));
    284   buffer=_ogg_malloc(framesize*4);
    285   buffer2=buffer+framesize*2;
    286   window=_vorbis_window_create(0,framesize,framesize/2,framesize/2);
    287   mdct_init(&m_look,framesize);
    288   drft_init(&f_look,framesize);
    289   _vp_psy_init(&p_look,&_psy_set0,&_psy_set0G,framesize/2,44100);
    290   pg_look=_vp_global_look(&vi);
    291   floor_look=_floor_P[1]->look(NULL,NULL,&_floor_set0);
    292 
    293   /* we cheat on the WAV header; we just bypass 44 bytes and never
    294      verify that it matches 16bit/stereo/44.1kHz. */
    295 
    296   fread(buffer,1,44,stdin);
    297   fwrite(buffer,1,44,stdout);
    298   memset(buffer,0,framesize*2);
    299 
    300   analysis("window",0,window,framesize,0,0);
    301 
    302   fprintf(stderr,"Processing for frame size %d...\n",framesize);
    303 
    304   while(!eos){
    305     long bytes=fread(buffer2,1,framesize*2,stdin);
    306     if(bytes<framesize*2)
    307       memset(buffer2+bytes,0,framesize*2-bytes);
    308 
    309     if(bytes!=0){
    310       int nonzero[2];
    311 
    312       /* uninterleave samples */
    313       for(i=0;i<framesize;i++){
    314         pcm[0][i]=((buffer[i*4+1]<<8)|
    315                       (0x00ff&(int)buffer[i*4]))/32768.f;
    316         pcm[1][i]=((buffer[i*4+3]<<8)|
    317                    (0x00ff&(int)buffer[i*4+2]))/32768.f;
    318       }
    319 
    320       {
    321         float secs=framesize/44100.;
    322 
    323         ampmax+=secs*ampmax_att_per_sec;
    324         if(ampmax<-9999)ampmax=-9999;
    325       }
    326 
    327       for(i=0;i<2;i++){
    328         float scale=4.f/framesize;
    329         float *fft=work[i];
    330         float *mdct=pcm[i];
    331         float *logmdct=mdct+framesize/2;
    332 
    333         analysis("pre",frameno+i,pcm[i],framesize,0,0);
    334 
    335         /* fft and mdct transforms  */
    336         for(j=0;j<framesize;j++)
    337           fft[j]=pcm[i][j]*=window[j];
    338 
    339         drft_forward(&f_look,fft);
    340 
    341         local_ampmax[i]=-9999.f;
    342         fft[0]*=scale;
    343         fft[0]=todB(fft);
    344         for(j=1;j<framesize-1;j+=2){
    345           float temp=scale*FAST_HYPOT(fft[j],fft[j+1]);
    346           temp=fft[(j+1)>>1]=todB(&temp);
    347           if(temp>local_ampmax[i])local_ampmax[i]=temp;
    348         }
    349         if(local_ampmax[i]>ampmax)ampmax=local_ampmax[i];
    350 
    351         mdct_forward(&m_look,pcm[i],mdct);
    352         for(j=0;j<framesize/2;j++)
    353           logmdct[j]=todB(mdct+j);
    354 
    355         analysis("mdct",frameno+i,logmdct,framesize/2,1,0);
    356         analysis("fft",frameno+i,fft,framesize/2,1,0);
    357       }
    358 
    359       for(i=0;i<2;i++){
    360         float amp;
    361         float *fft=work[i];
    362         float *logmax=fft;
    363         float *mdct=pcm[i];
    364         float *logmdct=mdct+framesize/2;
    365         float *mask=fft+framesize/2;
    366 
    367         /* floor psychoacoustics */
    368         _vp_compute_mask(&p_look,
    369                          pg_look,
    370                          i,
    371                          fft,
    372                          logmdct,
    373                          mask,
    374                          ampmax,
    375                          local_ampmax[i],
    376                          framesize/2);
    377 
    378         analysis("mask",frameno+i,mask,framesize/2,1,0);
    379 
    380         {
    381           vorbis_block vb;
    382           vorbis_dsp_state vd;
    383           memset(&vd,0,sizeof(vd));
    384           vd.vi=&vi;
    385           vb.vd=&vd;
    386           vb.pcmend=framesize;
    387 
    388           /* floor quantization/application */
    389           nonzero[i]=_floor_P[1]->forward(&vb,floor_look,
    390                                           mdct,
    391                                           logmdct,
    392                                           mask,
    393                                           logmax,
    394 
    395                                           flr[i]);
    396         }
    397 
    398         _vp_remove_floor(&p_look,
    399                          pg_look,
    400                          logmdct,
    401                          mdct,
    402                          flr[i],
    403                          pcm[i],
    404                          local_ampmax[i]);
    405 
    406         for(j=0;j<framesize/2;j++)
    407           if(fabs(pcm[i][j])>1500)
    408             fprintf(stderr,"%ld ",frameno+i);
    409 
    410         analysis("res",frameno+i,pcm[i],framesize/2,1,0);
    411         analysis("codedflr",frameno+i,flr[i],framesize/2,1,1);
    412       }
    413 
    414       /* residue prequantization */
    415       _vp_partition_prequant(&p_look,
    416                              &vi,
    417                              pcm,
    418                              nonzero);
    419 
    420       for(i=0;i<2;i++)
    421         analysis("quant",frameno+i,pcm[i],framesize/2,1,0);
    422 
    423       /* channel coupling / stereo quantization */
    424 
    425       _vp_couple(&p_look,
    426                  &mapping_info,
    427                  pcm,
    428                  nonzero);
    429 
    430       for(i=0;i<2;i++)
    431         analysis("coupled",frameno+i,pcm[i],framesize/2,1,0);
    432 
    433       /* decoupling */
    434       for(i=mapping_info.coupling_steps-1;i>=0;i--){
    435         float *pcmM=pcm[mapping_info.coupling_mag[i]];
    436         float *pcmA=pcm[mapping_info.coupling_ang[i]];
    437 
    438         for(j=0;j<framesize/2;j++){
    439           float mag=pcmM[j];
    440           float ang=pcmA[j];
    441 
    442           if(mag>0)
    443             if(ang>0){
    444               pcmM[j]=mag;
    445               pcmA[j]=mag-ang;
    446             }else{
    447               pcmA[j]=mag;
    448               pcmM[j]=mag+ang;
    449             }
    450           else
    451             if(ang>0){
    452               pcmM[j]=mag;
    453               pcmA[j]=mag+ang;
    454             }else{
    455               pcmA[j]=mag;
    456               pcmM[j]=mag-ang;
    457             }
    458         }
    459       }
    460 
    461       for(i=0;i<2;i++)
    462         analysis("decoupled",frameno+i,pcm[i],framesize/2,1,0);
    463 
    464       for(i=0;i<2;i++){
    465         float amp;
    466 
    467         for(j=0;j<framesize/2;j++)
    468           pcm[i][j]*=flr[i][j];
    469 
    470         analysis("final",frameno+i,pcm[i],framesize/2,1,1);
    471 
    472         /* take it back to time */
    473         mdct_backward(&m_look,pcm[i],pcm[i]);
    474 
    475         for(j=0;j<framesize/2;j++)
    476           out[i][j]+=pcm[i][j]*window[j];
    477 
    478         analysis("out",frameno+i,out[i],framesize/2,0,0);
    479 
    480 
    481       }
    482 
    483       /* write data.  Use the part of buffer we're about to shift out */
    484       for(i=0;i<2;i++){
    485         char  *ptr=buffer+i*2;
    486         float *mono=out[i];
    487         int flag=0;
    488         for(j=0;j<framesize/2;j++){
    489           int val=mono[j]*32767.;
    490           /* might as well guard against clipping */
    491           if(val>32767){
    492             if(!flag)fprintf(stderr,"clipping in frame %ld ",frameno+i);
    493             flag=1;
    494             val=32767;
    495           }
    496           if(val<-32768){
    497             if(!flag)fprintf(stderr,"clipping in frame %ld ",frameno+i);
    498             flag=1;
    499             val=-32768;
    500           }
    501           ptr[0]=val&0xff;
    502           ptr[1]=(val>>8)&0xff;
    503           ptr+=4;
    504         }
    505       }
    506 
    507       fprintf(stderr,"*");
    508       fwrite(buffer,1,framesize*2,stdout);
    509       memmove(buffer,buffer2,framesize*2);
    510 
    511       for(i=0;i<2;i++){
    512         for(j=0,k=framesize/2;j<framesize/2;j++,k++)
    513           out[i][j]=pcm[i][k]*window[k];
    514       }
    515       frameno+=2;
    516     }else
    517       eos=1;
    518   }
    519   fprintf(stderr,"average raw bits of entropy: %.03g/sample\n",acc/tot);
    520   fprintf(stderr,"average nonzero samples: %.03g/%d\n",nonz/tot*framesize/2,
    521           framesize/2);
    522   fprintf(stderr,"Done\n\n");
    523   return 0;
    524 }
    525