1 /********************************************************************
3 * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE. *
4 * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS *
5 * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE *
6 * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING. *
8 * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2002 *
9 * by the XIPHOPHORUS Company http://www.xiph.org/ *
11 ********************************************************************
13 function: simple utility that runs audio through the psychoacoustics
15 last mod: $Id: psytune.c,v 1.20 2003/03/04 21:22:11 xiphmont Exp $
17 ********************************************************************/
24 #include "vorbis/codec.h"
25 #include "codec_internal.h"
/* Global psychoacoustic settings for this utility; main() hands this
   struct to _vp_psy_init() together with _psy_set0. */
38 static vorbis_info_psy_global _psy_set0G={
40 8, /* lines per eighth octave */
42 /* thresh sample period, preecho clamp trigger threshold, range, minenergy */
43 256, {26.f,26.f,26.f,30.f}, {-90.f,-90.f,-90.f,-90.f}, -90.f,
/* Table of vp_part entries; the _psy_set0 initializer references it by
   name. One alternative row is kept commented out below.
   NOTE(review): the meaning of each column comes from the vp_part
   declaration, which is not visible here -- confirm before retuning. */
52 static vp_part _vp_part0[]={
53 { 1,9e10f, 9e10f, 1.f,9999.f},
54 { 9999, .75f, 9e10f, .5f,9999.f},
55 /*{ 9999, 1.5f, 9e10f, .5f,9999.f},*/
56 { 18,9e10f, 9e10f, .5f, 30.f},
57 { 9999,9e10f, 9e10f, .5f, 30.f}
/* Table of vp_couple entries; the _psy_set0 initializer references it
   by name.
   NOTE(review): the meaning of the leading integer and of each
   three-element group comes from the vp_couple declaration, which is
   not visible here -- confirm before retuning. */
60 static vp_couple _vp_couple0[]={
61 { 1, {9e10f,9e10f,0}, { 0.f, 0.f,0}, { 0.f, 0.f,0}, {0.f,0.f,0}},
62 { 18, {9e10f,9e10f,0}, { 0.f, 0.f,0}, { 0.f, 0.f,0}, {0.f,0.f,0}},
63 { 9999, {9e10f,9e10f,0}, { 0.f, 9e10f,0}, { 0.f,22.f,1}, {0.f,0.f,0}}
/* Psychoacoustic tuning parameters exercised by this utility; main()
   passes the struct to _vp_psy_init(). The two large tables below hold
   one row per frequency band (63 Hz .. 16 kHz, labelled at the end of
   each row) with eleven entries per row; the legend comment above the
   first table labels its columns 0 .. 100. The initializer also
   references _vp_part0 and _vp_couple0. */
66 static vorbis_info_psy _psy_set0={
67 ATH_Bark_dB_lineaggressive,
71 6.f, /* floor master att */
73 /* 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 */
74 /* x: 63 88 125 175 250 350 500 700 1k 1.4k 2k 2.8k 4k 5.6k 8k 11.5k 16k Hz */
75 /* y: 0 10 20 30 40 50 60 70 80 90 100 dB */
77 0.f, /* tone master att */
78 /* 0 10 20 30 40 50 60 70 80 90 100 */
80 {-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f}, /*63*/
81 {-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f}, /*88*/
82 {-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f,-999.f}, /*125*/
84 {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*175*/
85 {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*250*/
86 {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*350*/
87 {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*500*/
88 {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*700*/
89 {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*1000*/
90 {-30.f,-30.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*1400*/
91 {-40.f,-40.f,-40.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*2000*/
92 {-40.f,-40.f,-40.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*2800*/
93 {-40.f,-40.f,-40.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*4000*/
95 {-30.f,-35.f,-35.f,-40.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*5600*/
97 {-30.f,-30.f,-33.f,-35.f,-40.f,-50.f,-60.f,-70.f,-80.f,-90.f,-100.f}, /*8000*/
98 {-30.f,-30.f,-33.f,-35.f,-40.f,-45.f,-50.f,-60.f,-70.f,-85.f,-100.f}, /*11500*/
99 {-24.f,-24.f,-26.f,-32.f,-32.f,-42.f,-50.f,-60.f,-70.f,-85.f,-100.f}, /*16000*/
104 {{-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*63*/
105 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*88*/
106 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*125*/
107 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*175*/
108 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*250*/
109 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*350*/
110 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*500*/
111 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*700*/
112 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*1000*/
113 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*1400*/
114 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*2000*/
115 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*2800*/
116 {-14.f,-20.f,-20.f,-20.f,-26.f,-32.f,-40.f,-40.f,-40.f,-40.f,-40.f},/*4000*/
117 {-10.f,-12.f,-14.f,-16.f,-16.f,-20.f,-24.f,-30.f,-32.f,-40.f,-40.f},/*5600*/
118 {-10.f,-12.f,-14.f,-16.f,-16.f,-20.f,-24.f,-30.f,-32.f,-40.f,-40.f},/*8000*/
119 {-10.f,-10.f,-10.f,-12.f,-14.f,-18.f,-22.f,-28.f,-32.f,-40.f,-40.f},/*11500*/
120 {-10.f,-10.f,-10.f,-12.f,-14.f,-18.f,-22.f,-28.f,-32.f,-40.f,-40.f},/*16000*/
124 -10.f, /* suppress any noise curve over maxspec+n */
125 .5f, /* low window */
126 .5f, /* high window */
145 .900f, 0.f, /*11500*/
146 .900f, 1.f, /*16000*/
149 95.f, /* even decade + 5 is important; saves an rint() later in a
154 _vp_part0,_vp_couple0
/* Floor settings for this utility; main() passes the struct to
   _floor_P[1]->look() to build the floor lookup it uses per frame.
   NOTE(review): the numeric list below is grouped in threes in the
   source layout; what each group means is defined by
   vorbis_info_floor1, which is not visible here. */
157 static vorbis_info_floor1 _floor_set0={1,
172 6,3,10, 22,18,26, 41,36,47,
173 69,61,78, 112,99,126, 185,162,211,
174 329,282,387, 672,553,825
/* Channel mapping description; main() reads coupling_steps,
   coupling_mag and coupling_ang from it in the loop that runs just
   before the "decoupled" dump. */
183 static vorbis_info_mapping0 mapping_info={1,{0,1},{0},{0},{0},0, 1, {0},{1}};
/* Codec setup record; main() installs its address in vi.codec_setup
   before creating the global psy lookup. Only the first line of the
   initializer is visible in this excerpt. */
184 static codec_setup_info codec_setup0={ {0,0},
/* Write the contents of v to a text file named "<base>_<i>.m".
   Every emitted line is an x value followed by a y value: x is either
   toBARK(22050.f*j/n) or the plain index j, and y is either todB() of
   the sample or the raw sample.
   NOTE(review): presumably the `bark` and `dB` flags pick between those
   forms and `n` bounds the loop -- the selecting conditionals and the
   loop header are not visible in this excerpt.
   NOTE(review): sprintf() does not bound the write into `buffer`, and no
   check of the fopen() result is visible here; confirm both. */
196 void analysis(char *base,int i,float *v,int n,int bark,int dB){
201 sprintf(buffer,"%s_%d.m",base,i);
202 of=fopen(buffer,"w");
209 fprintf(of,"%g ",toBARK(22050.f*j/n));
211 fprintf(of,"%g ",(float)j);
214 fprintf(of,"%g\n",todB(v+j));
216 fprintf(of,"%g\n",v[j]);
226 /****************************************************************/
/* Entry point: copies a 44-byte header from stdin to stdout, then
   processes the remaining input frame by frame. For each channel the
   visible steps are: windowing, forward FFT and MDCT, mask computation,
   floor forward/removal, residue prequantization, channel coupling and
   decoupling, re-application of the floor, inverse MDCT and windowed
   overlap-add into out[]. Intermediate vectors are dumped through
   analysis(); progress and statistics go to stderr. */
228 int main(int argc,char *argv[]){
233 float ampmax=-9999,newmax;
234 float local_ampmax[2];
237 float ampmax_att_per_sec=-6.;
239 float *pcm[2],*out[2],*window,*flr[2],*mask[2],*work[2];
240 signed char *buffer,*buffer2;
243 vorbis_look_psy p_look;
244 vorbis_look_psy_global *pg_look;
245 vorbis_look_floor *floor_look;
/* NOTE(review): atoi() reports no conversion errors, and framesize goes
   on to size every allocation below; no validation is visible here. */
266 framesize=atoi(argv[0]);
271 vi.codec_setup=&codec_setup0;
/* NOTE(review): none of these allocation results has a visible NULL
   check before use. */
273 pcm[0]=_ogg_malloc(framesize*sizeof(float));
274 pcm[1]=_ogg_malloc(framesize*sizeof(float));
275 out[0]=_ogg_calloc(framesize/2,sizeof(float));
276 out[1]=_ogg_calloc(framesize/2,sizeof(float));
277 work[0]=_ogg_calloc(framesize,sizeof(float));
278 work[1]=_ogg_calloc(framesize,sizeof(float));
279 flr[0]=_ogg_calloc(framesize/2,sizeof(float));
280 flr[1]=_ogg_calloc(framesize/2,sizeof(float));
/* buffer holds framesize*4 bytes; buffer2 addresses its second half */
281 buffer=_ogg_malloc(framesize*4);
282 buffer2=buffer+framesize*2;
283 window=_vorbis_window_create(0,framesize,framesize/2,framesize/2);
284 mdct_init(&m_look,framesize);
285 drft_init(&f_look,framesize);
286 _vp_psy_init(&p_look,&_psy_set0,&_psy_set0G,framesize/2,44100);
287 pg_look=_vp_global_look(&vi);
288 floor_look=_floor_P[1]->look(NULL,NULL,&_floor_set0);
290 /* we cheat on the WAV header; we just bypass 44 bytes and never
291 verify that it matches 16bit/stereo/44.1kHz. */
/* NOTE(review): the fread()/fwrite() results are ignored, so a short or
   missing header goes undetected. */
293 fread(buffer,1,44,stdin);
294 fwrite(buffer,1,44,stdout);
/* clear the first half of buffer */
295 memset(buffer,0,framesize*2);
297 analysis("window",0,window,framesize,0,0);
299 fprintf(stderr,"Processing for frame size %d...\n",framesize);
/* read framesize*2 new bytes into the second half; zero-fill whatever
   a short read left unwritten */
302 long bytes=fread(buffer2,1,framesize*2,stdin);
303 if(bytes<framesize*2)
304 memset(buffer2+bytes,0,framesize*2-bytes);
309 /* uninterleave samples */
/* Each sample is built from two bytes, low byte first, and scaled by
   1/32768; four bytes per index cover both channels.
   NOTE(review): buffer is signed char, so buffer[...]<<8 left-shifts a
   negative value whenever the high byte is negative, which ISO C leaves
   undefined; multiplying by 256 would express the same intent. */
310 for(i=0;i<framesize;i++){
311 pcm[0][i]=((buffer[i*4+1]<<8)|
312 (0x00ff&(int)buffer[i*4]))/32768.f;
313 pcm[1][i]=((buffer[i*4+3]<<8)|
314 (0x00ff&(int)buffer[i*4+2]))/32768.f;
/* let the running ampmax fall by ampmax_att_per_sec scaled to one
   frame's duration, but never below -9999 */
318 float secs=framesize/44100.;
320 ampmax+=secs*ampmax_att_per_sec;
321 if(ampmax<-9999)ampmax=-9999;
325 float scale=4.f/framesize;
328 float *logmdct=mdct+framesize/2;
330 analysis("pre",frameno+i,pcm[i],framesize,0,0);
332 /* fft and mdct transforms */
/* the window is applied to pcm[i] in place and the result copied to fft */
333 for(j=0;j<framesize;j++)
334 fft[j]=pcm[i][j]*=window[j];
336 drft_forward(&f_look,fft);
338 local_ampmax[i]=-9999.f;
/* combine adjacent pairs of transform outputs with FAST_HYPOT, convert
   through todB(), store the results compacted at the front of fft[],
   and track the per-channel maximum */
341 for(j=1;j<framesize-1;j+=2){
342 float temp=scale*FAST_HYPOT(fft[j],fft[j+1]);
343 temp=fft[(j+1)>>1]=todB(&temp);
344 if(temp>local_ampmax[i])local_ampmax[i]=temp;
346 if(local_ampmax[i]>ampmax)ampmax=local_ampmax[i];
348 mdct_forward(&m_look,pcm[i],mdct);
349 for(j=0;j<framesize/2;j++)
350 logmdct[j]=todB(mdct+j);
352 analysis("mdct",frameno+i,logmdct,framesize/2,1,0);
353 analysis("fft",frameno+i,fft,framesize/2,1,0);
/* NOTE(review): this local `mask` has the same name as the mask[2]
   array declared at the top of main -- confirm the shadowing is
   intended. */
361 float *logmdct=mdct+framesize/2;
362 float *mask=fft+framesize/2;
364 /* floor psychoacoustics */
365 _vp_compute_mask(&p_look,
375 analysis("mask",frameno+i,mask,framesize/2,1,0);
380 memset(&vd,0,sizeof(vd));
385 /* floor quantization/application */
386 nonzero[i]=_floor_P[1]->forward(&vb,floor_look,
395 _vp_remove_floor(&p_look,
/* report the frame number on stderr for every pcm[i] value whose
   magnitude exceeds 1500 */
403 for(j=0;j<framesize/2;j++)
404 if(fabs(pcm[i][j])>1500)
405 fprintf(stderr,"%ld ",frameno+i);
407 analysis("res",frameno+i,pcm[i],framesize/2,1,0);
408 analysis("codedflr",frameno+i,flr[i],framesize/2,1,1);
411 /* residue prequantization */
412 _vp_partition_prequant(&p_look,
418 analysis("quant",frameno+i,pcm[i],framesize/2,1,0);
420 /* channel coupling / stereo quantization */
428 analysis("coupled",frameno+i,pcm[i],framesize/2,1,0);
/* walk the coupling steps from last to first, picking the two channel
   buffers named by coupling_mag and coupling_ang for each step */
431 for(i=mapping_info.coupling_steps-1;i>=0;i--){
432 float *pcmM=pcm[mapping_info.coupling_mag[i]];
433 float *pcmA=pcm[mapping_info.coupling_ang[i]];
435 for(j=0;j<framesize/2;j++){
459 analysis("decoupled",frameno+i,pcm[i],framesize/2,1,0);
/* multiply the floor curve back into the values */
464 for(j=0;j<framesize/2;j++)
465 pcm[i][j]*=flr[i][j];
467 analysis("final",frameno+i,pcm[i],framesize/2,1,1);
469 /* take it back to time */
470 mdct_backward(&m_look,pcm[i],pcm[i]);
/* add the windowed first half of the inverse transform onto out[i] */
472 for(j=0;j<framesize/2;j++)
473 out[i][j]+=pcm[i][j]*window[j];
475 analysis("out",frameno+i,out[i],framesize/2,0,0);
480 /* write data. Use the part of buffer we're about to shift out */
482 char *ptr=buffer+i*2;
485 for(j=0;j<framesize/2;j++){
486 int val=mono[j]*32767.;
487 /* might as well guard against clipping */
489 if(!flag)fprintf(stderr,"clipping in frame %ld ",frameno+i);
494 if(!flag)fprintf(stderr,"clipping in frame %ld ",frameno+i);
499 ptr[1]=(val>>8)&0xff;
/* emit the first half of buffer, then move the second half down */
505 fwrite(buffer,1,framesize*2,stdout);
506 memmove(buffer,buffer2,framesize*2);
/* overwrite out[i] with the windowed second half of pcm[i]; presumably
   the next frame's overlap-add builds on it */
509 for(j=0,k=framesize/2;j<framesize/2;j++,k++)
510 out[i][j]=pcm[i][k]*window[k];
516 fprintf(stderr,"average raw bits of entropy: %.03g/sample\n",acc/tot);
517 fprintf(stderr,"average nonzero samples: %.03g/%d\n",nonz/tot*framesize/2,
519 fprintf(stderr,"Done\n\n");