1 /********************************************************************
3 * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE. *
4 * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS *
5 * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE *
6 * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING. *
8 * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2001 *
9 * by the XIPHOPHORUS Company http://www.xiph.org/ *
11 ********************************************************************
13 function: residue backend 0, 1 and 2 implementation
14 last mod: $Id: res0.c,v 1.38 2001/12/12 09:45:25 xiphmont Exp $
16 ********************************************************************/
18 /* Slow, slow, slow, simpleminded and did I mention it was slow? The
19 encode/decode loops are coded for clarity and performance is not
20 yet even a nagging little idea lurking in the shadows. Oh and BTW,
28 #include "vorbis/codec.h"
29 #include "codec_internal.h"
/* Residue setup this lookup belongs to; the routines in this file read it
   back through look->info. */
36 vorbis_info_residue0 *info;
/* Stage codebooks, addressed as partbooks[partition class][stage]. */
43 codebook ***partbooks;
/* Partition-index thresholds; res0_look fills entry i with
   partvals*(i+1)/BITTRACK_DIVISOR. */
52 int qoffsets[BITTRACK_DIVISOR+1];
54 } vorbis_look_residue0;
/* Duplicate a residue setup block.
   vr is treated as a vorbis_info_residue0; a new struct of the same size is
   obtained from _ogg_malloc and filled with a bytewise copy of it.
   NOTE(review): the allocation result is passed to memcpy without a NULL
   check in the lines visible here; the return statement is not shown. */
56 vorbis_info_residue *res0_copy_info(vorbis_info_residue *vr){
57 vorbis_info_residue0 *info=(vorbis_info_residue0 *)vr;
58 vorbis_info_residue0 *ret=_ogg_malloc(sizeof(*ret));
59 memcpy(ret,info,sizeof(*ret));
/* Dispose of a residue setup block.
   The visible code overwrites the whole vorbis_info_residue0 with zeros.
   NOTE(review): any NULL guard and the release of the memory itself are not
   visible in this excerpt; confirm against the full file. */
63 void res0_free_info(vorbis_info_residue *i){
64 vorbis_info_residue0 *info=(vorbis_info_residue0 *)i;
66 memset(info,0,sizeof(*info));
/* Tear down a residue lookup built by res0_look.
   Prints a bit-usage summary to stderr, frees every partbooks[j] row and the
   partbooks table, frees every decodemap[j] row and the decodemap table, and
   finally zeroes the lookup struct. */
71 void res0_free_look(vorbis_look_residue *i){
75 vorbis_look_residue0 *look=(vorbis_look_residue0 *)i;
/* Per-frame averages are computed in float, so look->frames==0 produces
   inf/NaN output rather than an integer divide fault.
   NOTE(review): confirm whether this report is intended outside debugging. */
77 fprintf(stderr,"residue bit usage %f:%f (%f total)\n",
78 (float)look->phrasebits/look->frames,
79 (float)look->postbits/look->frames,
80 (float)(look->postbits+look->phrasebits)/look->frames);
82 /*vorbis_info_residue0 *info=look->info;
85 "%ld frames encoded in %ld phrasebits and %ld residue bits "
86 "(%g/frame) \n",look->frames,look->phrasebits,
88 (look->phrasebits+look->resbitsflat)/(float)look->frames);
90 for(j=0;j<look->parts;j++){
92 fprintf(stderr,"\t[%d] == ",j);
93 for(k=0;k<look->stages;k++)
94 if((info->secondstages[j]>>k)&1){
95 fprintf(stderr,"%ld,",look->resbits[j][k]);
96 acc+=look->resbits[j][k];
99 fprintf(stderr,":: (%ld vals) %1.2fbits/sample\n",look->resvals[j],
100 acc?(float)acc/(look->resvals[j]*info->grouping):0);
102 fprintf(stderr,"\n");*/
/* One row of stage-book pointers per partition class (see res0_look). */
104 for(j=0;j<look->parts;j++)
105 if(look->partbooks[j])_ogg_free(look->partbooks[j]);
106 _ogg_free(look->partbooks);
/* decodemap has partvals rows, each allocated separately in res0_look. */
107 for(j=0;j<look->partvals;j++)
108 _ogg_free(look->decodemap[j]);
109 _ogg_free(look->decodemap);
/* Clear the struct so stale pointers are not left behind. */
110 memset(look,0,sizeof(*look));
/* Integer helper used on the secondstages bitmasks: res0_look takes its
   result as the number of stages for a partition class and res0_pack uses it
   to choose the cascade encoding.
   NOTE(review): body not visible here; presumably the bit length of v. */
115 static int ilog(unsigned int v){
/* Integer helper whose result is accumulated over all secondstages masks in
   res0_pack and res0_unpack.
   NOTE(review): body not visible here; presumably the number of set bits in
   v, i.e. how many booklist entries a mask accounts for. */
124 static int icount(unsigned int v){
/* Serialize a residue setup into the bitstream buffer opb.
   Layout written by the visible code: begin (24 bits), end (24 bits),
   grouping-1 (24 bits), partitions-1 (6 bits), groupbook (8 bits), then one
   cascade bitmask per partition class, then 8-bit codebook numbers taken
   from booklist. res0_unpack reads the same fields in the same order. */
134 void res0_pack(vorbis_info_residue *vr,oggpack_buffer *opb){
135 vorbis_info_residue0 *info=(vorbis_info_residue0 *)vr;
137 oggpack_write(opb,info->begin,24);
138 oggpack_write(opb,info->end,24);
140 oggpack_write(opb,info->grouping-1,24); /* residue vectors to group and
141 code with a partitioned book */
142 oggpack_write(opb,info->partitions-1,6); /* possible partition choices */
143 oggpack_write(opb,info->groupbook,8); /* group huffman book */
145 /* secondstages is a bitmask; as encoding progresses pass by pass, a
146 bitmask of one indicates this partition class has bits to write
148 for(j=0;j<info->partitions;j++){
149 if(ilog(info->secondstages[j])>3){
150 /* yes, this is a minor hack due to not thinking ahead */
/* Long form: low 3 bits, a set flag bit, then the bits above the low three
   in a further 5 bits. Presumably relies on oggpack_write keeping only the
   requested number of low bits; confirm. */
151 oggpack_write(opb,info->secondstages[j],3);
152 oggpack_write(opb,1,1);
153 oggpack_write(opb,info->secondstages[j]>>3,5);
/* Short form: written as 4 bits; presumably the other branch of the ilog
   test above, so the 4th bit is the zero flag. */
155 oggpack_write(opb,info->secondstages[j],4); /* trailing zero */
156 acc+=icount(info->secondstages[j]);
/* Codebook numbers, 8 bits each; the loop bound is not visible here but is
   presumably acc, the total accumulated above. */
159 oggpack_write(opb,info->booklist[j],8);
/* Parse a residue setup from the bitstream buffer opb into a freshly
   zero-allocated vorbis_info_residue0. Fields are read in the order
   res0_pack writes them. Codebook numbers that are not below ci->books
   send control to errout, where the partially filled struct is handed to
   res0_free_info. The success return is not visible in this excerpt. */
163 /* vorbis_info is for range checking */
164 vorbis_info_residue *res0_unpack(vorbis_info *vi,oggpack_buffer *opb){
166 vorbis_info_residue0 *info=_ogg_calloc(1,sizeof(*info));
167 codec_setup_info *ci=vi->codec_setup;
169 info->begin=oggpack_read(opb,24);
170 info->end=oggpack_read(opb,24);
/* grouping and partitions are stored minus one, hence the +1. */
171 info->grouping=oggpack_read(opb,24)+1;
172 info->partitions=oggpack_read(opb,6)+1;
173 info->groupbook=oggpack_read(opb,8);
/* Cascade bitmask per partition class: 3 low bits, a flag bit, and when the
   flag is set 5 more bits placed above the low three. */
175 for(j=0;j<info->partitions;j++){
176 int cascade=oggpack_read(opb,3);
177 if(oggpack_read(opb,1))
178 cascade|=(oggpack_read(opb,5)<<3);
179 info->secondstages[j]=cascade;
181 acc+=icount(cascade);
/* 8-bit codebook numbers follow (loop header not visible here). */
184 info->booklist[j]=oggpack_read(opb,8);
/* Range checks against the number of codebooks in the setup header. */
186 if(info->groupbook>=ci->books)goto errout;
188 if(info->booklist[j]>=ci->books)goto errout;
192 res0_free_info(info);
/* Build the runtime lookup (vorbis_look_residue0) for one residue setup.
   vd supplies the decoded codebooks through its backend state, vm supplies
   the mapping number, vr is the vorbis_info_residue0 to index.
   The lookup is zero-allocated; the visible code fills in the phrase book,
   the per-class stage-book table, the phrase decode map and the qoffsets
   thresholds. Allocation results are used without checks in the lines
   shown. The return statement is not visible in this excerpt. */
196 vorbis_look_residue *res0_look(vorbis_dsp_state *vd,vorbis_info_mode *vm,
197 vorbis_info_residue *vr){
198 vorbis_info_residue0 *info=(vorbis_info_residue0 *)vr;
199 vorbis_look_residue0 *look=_ogg_calloc(1,sizeof(*look));
200 backend_lookup_state *be=vd->backend_state;
206 look->map=vm->mapping;
208 look->parts=info->partitions;
209 look->fullbooks=be->fullbooks;
/* The phrase book is the groupbook-th entry of the shared codebook array;
   its dimension is the number of partitions packed into one codeword. */
210 look->phrasebook=be->fullbooks+info->groupbook;
211 dim=look->phrasebook->dim;
/* One row of stage-book pointers per partition class. */
213 look->partbooks=_ogg_calloc(look->parts,sizeof(*look->partbooks));
215 for(j=0;j<look->parts;j++){
216 int stages=ilog(info->secondstages[j]);
218 if(stages>maxstage)maxstage=stages;
219 look->partbooks[j]=_ogg_calloc(stages,sizeof(*look->partbooks[j]));
/* Each set bit k of the mask consumes the next booklist entry; stages
   whose bit is clear keep the NULL left by calloc. */
220 for(k=0;k<stages;k++)
221 if(info->secondstages[j]&(1<<k))
222 look->partbooks[j][k]=be->fullbooks+info->booklist[acc++];
/* partvals = parts^dim: the count of distinct phrase codeword values. */
226 look->partvals=rint(pow(look->parts,dim));
227 look->stages=maxstage;
/* decodemap[j] is a dim-entry array derived from j; the lines computing
   each entry (deco) are not visible here. Presumably these are the
   base-parts digits of j, starting from divisor mult=partvals/parts. */
228 look->decodemap=_ogg_malloc(look->partvals*sizeof(*look->decodemap));
229 for(j=0;j<look->partvals;j++){
231 long mult=look->partvals/look->parts;
232 look->decodemap[j]=_ogg_malloc(dim*sizeof(*look->decodemap[j]));
237 look->decodemap[j][k]=deco;
/* Note: this local partvals is the number of partitions in [begin,end),
   not look->partvals above. */
242 int samples_per_partition=info->grouping;
243 int n=info->end-info->begin,i;
244 int partvals=n/samples_per_partition;
/* Evenly spaced partition-index thresholds, followed by a very large value
   that appears to act as a terminator for the while(i>=qoffsets[bin])
   loops in _01forward. */
246 for(i=0;i<BITTRACK_DIVISOR;i++)
247 look->qoffsets[i]=partvals*(i+1)/BITTRACK_DIVISOR;
249 look->qoffsets[i]=9999999;
/* Partition classifier (interleaved variant).
   From the visible lines: takes absolute values of the n input samples into
   a scratch array, tracks maxima, rounds the scratch values with rint, and
   then scans classes 0..auxparts-2 for the first one whose limits (blimit,
   entmax for the class's subgroup, ampmax) all admit this partition.
   The entropy computation and the return value are not visible here;
   presumably the index of the matching class is returned. */
256 /* does not guard against invalid settings; eg, a subn of 16 and a
257 subgroup request of 32. Max subn of 128 */
258 static int _interleaved_testhack(float *vec,int n,vorbis_look_residue0 *look,
259 int auxparts,int auxpartnum){
260 vorbis_info_residue0 *info=look->info;
262 float max,localmax=0.f;
267 for(i=0;i<n;i++)temp[i]=fabs(vec[i]);
269 /* handle case subgrp==1 outside */
271 if(temp[i]>localmax)localmax=temp[i];
274 for(i=0;i<n;i++)temp[i]=rint(temp[i]);
287 if(temp[i]>localmax)localmax=temp[i];
/* Class selection: the last class (auxparts-1) is never tested here, so it
   is presumably the fallback when no earlier class matches. */
290 for(i=0;i<auxparts-1;i++)
291 if(auxpartnum<info->blimit[i] &&
292 entropy[info->subgrp[i]]<=info->entmax[i] &&
293 max<=info->ampmax[i])
/* Partition classifier (non-interleaved variant), used as the classify
   callback by res0_class, res1_class and res2_class.
   From the visible lines: takes absolute values of the n samples into a
   scratch array, records the maximum, rounds the scratch values with rint,
   and scans classes 0..auxparts-2 for the first whose blimit, entmax and
   ampmax limits all admit this partition. The entropy computation and the
   return value are not visible here. */
299 static int _testhack(float *vec,int n,vorbis_look_residue0 *look,
300 int auxparts,int auxpartnum){
301 vorbis_info_residue0 *info=look->info;
308 for(i=0;i<n;i++)temp[i]=fabs(vec[i]);
311 if(temp[i]>max)max=temp[i];
313 for(i=0;i<n;i++)temp[i]=rint(temp[i]);
/* The last class (auxparts-1) is not tested, so it is presumably the
   fallback. */
318 for(i=0;i<auxparts-1;i++)
319 if(auxpartnum<info->blimit[i] &&
320 entropy<=info->entmax[i] &&
321 max<=info->ampmax[i])
/* Encode one partition of n samples with the given codebook, interleaved
   layout: each vector starts at vec+i and is read with stride step.
   For every vector the best-matching entry is chosen with
   vorbis_book_besterror and written to opb; the bit counts returned by
   vorbis_book_encode are summed into bits, which is presumably the return
   value (loop header and return are not visible here). */
327 static int _interleaved_encodepart(oggpack_buffer *opb,float *vec, int n,
328 codebook *book,vorbis_look_residue0 *look){
334 int entry=vorbis_book_besterror(book,vec+i,step,0);
336 bits+=vorbis_book_encode(book,entry,opb);
/* Encode one partition of n samples with the given codebook, contiguous
   layout: vector i starts at vec+i*dim and is read with stride 1.
   For every vector the best-matching entry is chosen with
   vorbis_book_besterror and written to opb; the bit counts returned by
   vorbis_book_encode are summed into bits, which is presumably the return
   value (loop header and return are not visible here). */
342 static int _encodepart(oggpack_buffer *opb,float *vec, int n,
343 codebook *book,vorbis_look_residue0 *look){
349 int entry=vorbis_book_besterror(book,vec+i*dim,1,0);
351 bits+=vorbis_book_encode(book,entry,opb);
/* Classify every partition of every channel for residue types 0 and 1.
   Allocates (from the block-local allocator) one row of partition classes
   per channel, zeroes it, and fills it by calling the classify callback on
   each samples_per_partition-sized slice of [begin,end).
   NOTE(review): the tail of this block appends the class numbers to
   resaux_long.vqd or resaux_short.vqd; that looks like training/debug
   output and the guarding preprocessor lines are not visible here. The
   fopen result is used without a check in the lines shown. */
357 static long **_01class(vorbis_block *vb,vorbis_look_residue *vl,
359 int (*classify)(float *,int,vorbis_look_residue0 *,
362 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
363 vorbis_info_residue0 *info=look->info;
365 /* move all this setup out later */
366 int samples_per_partition=info->grouping;
367 int possible_partitions=info->partitions;
368 int n=info->end-info->begin;
/* Number of whole partitions in the coded range; a remainder is dropped by
   the integer division. */
370 int partvals=n/samples_per_partition;
371 long **partword=_vorbis_block_alloc(vb,ch*sizeof(*partword));
373 /* we find the partition type for each partition of each
374 channel. We'll go back and do the interleaved encoding in a
375 bit. For now, clarity */
378 partword[i]=_vorbis_block_alloc(vb,n/samples_per_partition*sizeof(*partword[i]));
379 memset(partword[i],0,n/samples_per_partition*sizeof(*partword[i]));
382 for(i=0;i<partvals;i++){
384 /* do the partition decision based on the 'entropy'
387 classify(in[j]+i*samples_per_partition+info->begin,
388 samples_per_partition,look,possible_partitions,i);
398 sprintf(buffer,"resaux_%s.vqd",(vb->mode?"long":"short"));
399 of=fopen(buffer,"a");
400 for(j=0;j<partvals;j++)
401 fprintf(of,"%ld, ",partword[i][j]);
/* Classify partitions for residue type 2.
   Only a single row of classes (partword[0]) is produced. Each partition is
   first gathered into the stack scratch buffer work (samples_per_partition
   floats, via alloca) and then passed to the classify callback.
   NOTE(review): the gather loop body is not visible here; presumably it
   interleaves samples from the ch input channels. The tail appends the
   class numbers to resaux_long.vqd or resaux_short.vqd, which looks like
   training/debug output; the fopen result is used without a check in the
   lines shown. */
412 static long **_2class(vorbis_block *vb,vorbis_look_residue *vl,
414 int (*classify)(float *,int,vorbis_look_residue0 *,
417 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
418 vorbis_info_residue0 *info=look->info;
420 /* move all this setup out later */
421 int samples_per_partition=info->grouping;
422 int possible_partitions=info->partitions;
423 int n=info->end-info->begin;
425 int partvals=n/samples_per_partition;
/* Just one row pointer: all channels share a single classification. */
426 long **partword=_vorbis_block_alloc(vb,sizeof(*partword));
427 float *work=alloca(sizeof(*work)*samples_per_partition);
/* The row is sized for n*ch/samples_per_partition entries and zeroed. */
434 partword[0]=_vorbis_block_alloc(vb,n*ch/samples_per_partition*sizeof(*partword[0]));
435 memset(partword[0],0,n*ch/samples_per_partition*sizeof(*partword[0]));
437 for(i=0,j=0,k=0,l=info->begin;i<partvals;i++){
438 for(k=0;k<samples_per_partition;k++){
448 classify(work,samples_per_partition,look,possible_partitions,i);
454 sprintf(buffer,"resaux_%s.vqd",(vb->mode?"long":"short"));
455 of=fopen(buffer,"a");
456 for(i=0;i<partvals;i++)
457 fprintf(of,"%ld, ",partword[0][i]);
/* Shared encoder for residue types 0 and 1 (res2_forward also routes
   through it with a single merged channel).
   For each stage s belonging to the requested pass, walks the partitions in
   groups of partitions_per_word: first a phrase codeword describing the
   classes of the group is written, then the residual vectors of each
   partition whose class has a book for stage s are written through the
   encode callback. partword holds the classes chosen earlier by the
   *_class routines. When stats is non-NULL, bit positions are recorded at
   the qoffsets thresholds.
   NOTE(review): the file dumps (res_*_part*_it*.vqd) and the stderr
   statistics in this block look like training/debug output; the
   preprocessor lines that would guard them are not visible here. */
467 static int _01forward(vorbis_block *vb,vorbis_look_residue *vl,
469 int pass,long **partword,
470 int (*encode)(oggpack_buffer *,float *,int,
471 codebook *,vorbis_look_residue0 *),
472 ogg_uint32_t *stats){
474 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
475 vorbis_info_residue0 *info=look->info;
477 vorbis_dsp_state *vd=vb->vd;
478 vorbis_info *vi=vd->vi;
479 codec_setup_info *ci=vi->codec_setup;
482 /* move all this setup out later */
483 int samples_per_partition=info->grouping;
484 int possible_partitions=info->partitions;
485 int partitions_per_word=look->phrasebook->dim;
486 int n=info->end-info->begin;
488 int partvals=n/samples_per_partition;
/* Appends the raw samples of each partition to a per-class file. */
498 for(j=0;j<partvals;j++){
499 int class=partword[i][j];
500 float *ptr=in[i]+info->begin+j*samples_per_partition;
501 sprintf(buffer,"res_%s_part%d_it%d.vqd",(vb->mode?"long":"short"),
503 of=fopen(buffer,"a");
504 for(k=0;k<samples_per_partition;k++)
505 fprintf(of,"%.3f, ",ptr[k]);
/* Reset the per-class bit and sample counters. */
512 memset(resbits,0,sizeof(resbits));
513 memset(resvals,0,sizeof(resvals));
515 /* we code the partition words for each channel, then the residual
516 words for a partition per channel until we've written all the
517 residual words for that partition word. Then write the next
518 partition channel words... */
/* Stages covered by this pass: from the previous pass's limit (0 for the
   first pass) up to, but not including, passlimit[pass]. */
520 for(s=(pass==0?0:ci->passlimit[pass-1]);s<ci->passlimit[pass];s++){
522 ogg_uint32_t *qptr=NULL;
/* Each stage gets its own run of BITTRACK_DIVISOR slots in stats. */
523 if(stats)qptr=stats+s*BITTRACK_DIVISOR;
525 for(i=0;i<partvals;){
527 /* first we encode a partition codeword for each channel */
/* The classes of the group are combined into one number, treating them as
   digits in base possible_partitions (first partition most significant). */
530 long val=partword[j][i];
532 for(k=1;k<partitions_per_word;k++){
533 val*=possible_partitions;
535 val+=partword[j][i+k];
/* Only values the phrase book can represent are written. */
539 if(val<look->phrasebook->entries)
540 ret=vorbis_book_encode(look->phrasebook,val,&vb->opb);
544 look->phrasebits+=ret;
549 /* now we encode interleaved residual values for the partitions */
550 for(k=0;k<partitions_per_word && i<partvals;k++,i++){
551 long offset=i*samples_per_partition+info->begin;
/* Record the current bit position for every threshold already reached. */
553 if(qptr)while(i>=look->qoffsets[bin])
554 qptr[bin++]=oggpack_bits(&vb->opb);
557 if(s==0)resvals[partword[j][i]]+=samples_per_partition;
/* Write residual data only if this partition's class has a book for
   stage s. */
558 if(info->secondstages[partword[j][i]]&(1<<s)){
559 codebook *statebook=look->partbooks[partword[j][i]][s];
561 int ret=encode(&vb->opb,in[j]+offset,samples_per_partition,
564 resbits[partword[j][i]]+=ret;
569 if(qptr)while(i>=look->qoffsets[bin])
570 qptr[bin++]=oggpack_bits(&vb->opb);
/* Per-class summary: samples seen and average bits per sample.
   resvals[k] may be zero for unused classes; the division is done in
   float. */
577 fprintf(stderr,"%d :: ",vb->mode);
578 for(k=0;k<possible_partitions;k++){
579 fprintf(stderr,"%ld/%1.2g, ",resvals[k],(float)resbits[k]/resvals[k]);
581 totalbits+=resbits[k];
584 fprintf(stderr,":: %ld:%1.2g\n",total,(double)totalbits/total);
/* Shared decoder for residue types 0 and 1.
   For each stage, walks the partitions in groups of partitions_per_word.
   A phrase codeword is decoded per channel and mapped through decodemap to
   the list of partition classes for the group; then, for every partition
   whose class has a book for the current stage, decodepart adds the decoded
   residual into in[j] at the partition's offset.
   A -1 from either decode call jumps to eopbreak; a NULL decodemap row
   jumps to errout. The code at those labels is not visible here. */
589 /* a truncated packet here just means 'stop working'; it's not an error */
590 static int _01inverse(vorbis_block *vb,vorbis_look_residue *vl,
592 long (*decodepart)(codebook *, float *,
593 oggpack_buffer *,int)){
596 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
597 vorbis_info_residue0 *info=look->info;
599 /* move all this setup out later */
600 int samples_per_partition=info->grouping;
601 int partitions_per_word=look->phrasebook->dim;
602 int n=info->end-info->begin;
604 int partvals=n/samples_per_partition;
/* Number of phrase codewords needed to cover partvals, rounded up. */
605 int partwords=(partvals+partitions_per_word-1)/partitions_per_word;
/* Per-channel row pointers live on the stack; the rows themselves come
   from the block-local allocator. */
606 int ***partword=alloca(ch*sizeof(*partword));
609 partword[j]=_vorbis_block_alloc(vb,partwords*sizeof(*partword[j]));
611 for(s=0;s<look->stages;s++){
613 /* each loop decodes one partition codeword containing
614 partitions_per_word partitions */
/* i counts partitions, l counts phrase codewords. */
615 for(i=0,l=0;i<partvals;l++){
617 /* fetch the partition word for each channel */
/* NOTE(review): temp is only compared against -1 before indexing
   decodemap; this presumably relies on the phrase book having no more
   entries than look->partvals. Confirm. */
619 int temp=vorbis_book_decode(look->phrasebook,&vb->opb);
620 if(temp==-1)goto eopbreak;
621 partword[j][l]=look->decodemap[temp];
622 if(partword[j][l]==NULL)goto errout;
626 /* now we decode residual values for the partitions */
627 for(k=0;k<partitions_per_word && i<partvals;k++,i++)
629 long offset=info->begin+i*samples_per_partition;
/* partword[j][l][k] is the class of the k-th partition in this group. */
630 if(info->secondstages[partword[j][l][k]]&(1<<s)){
631 codebook *stagebook=look->partbooks[partword[j][l][k]][s];
633 if(decodepart(stagebook,in[j]+offset,&vb->opb,
634 samples_per_partition)==-1)goto eopbreak;
646 /* residue 0 and 1 are just slight variants of one another. 0 is
647 interleaved, 1 is not */
/* Classification entry point for residue type 0. Delegates to _01class with
   the _testhack classifier; the interleaved classifier call is left
   commented out. The lines that compute used from nonzero are not visible
   in this excerpt. */
648 long **res0_class(vorbis_block *vb,vorbis_look_residue *vl,
649 float **in,int *nonzero,int ch){
650 /* we encode only the nonzero parts of a bundle */
656 /*return(_01class(vb,vl,in,used,_interleaved_testhack));*/
657 return(_01class(vb,vl,in,used,_testhack));
/* Encode entry point for residue type 0.
   Runs _01forward with the interleaved partition encoder, then subtracts
   the (modified) input from out over the half-block length n. A separate
   visible path fills every stats slot up to vorbis_bitrate_maxmarkers()
   with the current bit position. The conditions selecting between these
   paths, and the return statements, are not visible in this excerpt. */
662 int res0_forward(vorbis_block *vb,vorbis_look_residue *vl,
663 float **in,float **out,int *nonzero,int ch,
664 int pass, long **partword,ogg_uint32_t *stats){
665 /* we encode only the nonzero parts of a bundle */
666 int i,j,used=0,n=vb->pcmend/2;
674 int ret=_01forward(vb,vl,in,used,pass,partword,
675 _interleaved_encodepart,stats);
680 out[i][j]-=in[used][j];
685 for(i=0;i<vorbis_bitrate_maxmarkers();i++)
686 stats[i]=oggpack_bits(&vb->opb);
/* Decode entry point for residue type 0: runs _01inverse with
   vorbis_book_decodevs_add as the partition decoder. The lines that compute
   used from nonzero are not visible in this excerpt. */
692 int res0_inverse(vorbis_block *vb,vorbis_look_residue *vl,
693 float **in,int *nonzero,int ch){
699 return(_01inverse(vb,vl,in,used,vorbis_book_decodevs_add));
/* Encode entry point for residue type 1.
   Same shape as res0_forward but uses the contiguous partition encoder
   _encodepart. After encoding, the input is subtracted from out over the
   half-block length n; a separate visible path fills every stats slot up to
   vorbis_bitrate_maxmarkers() with the current bit position. The selecting
   conditions and return statements are not visible in this excerpt. */
704 int res1_forward(vorbis_block *vb,vorbis_look_residue *vl,
705 float **in,float **out,int *nonzero,int ch,
706 int pass, long **partword, ogg_uint32_t *stats){
707 int i,j,used=0,n=vb->pcmend/2;
716 int ret=_01forward(vb,vl,in,used,pass,partword,_encodepart,stats);
721 out[i][j]-=in[used][j];
726 for(i=0;i<vorbis_bitrate_maxmarkers();i++)
727 stats[i]=oggpack_bits(&vb->opb);
/* Classification entry point for residue type 1: delegates to _01class with
   the _testhack classifier. The lines that compute used from nonzero are
   not visible in this excerpt. */
733 long **res1_class(vorbis_block *vb,vorbis_look_residue *vl,
734 float **in,int *nonzero,int ch){
740 return(_01class(vb,vl,in,used,_testhack));
/* Decode entry point for residue type 1: runs _01inverse with
   vorbis_book_decodev_add as the partition decoder. The lines that compute
   used from nonzero are not visible in this excerpt. */
745 int res1_inverse(vorbis_block *vb,vorbis_look_residue *vl,
746 float **in,int *nonzero,int ch){
752 return(_01inverse(vb,vl,in,used,vorbis_book_decodev_add));
/* Classification entry point for residue type 2: delegates to _2class with
   the _testhack classifier. The lines that compute used from nonzero are
   not visible in this excerpt. */
757 long **res2_class(vorbis_block *vb,vorbis_look_residue *vl,
758 float **in,int *nonzero,int ch){
764 return(_2class(vb,vl,in,used,_testhack));
769 /* res2 is slightly more different; all the channels are interleaved
770 into a single vector and encoded. */
/* Encode entry point for residue type 2.
   A scratch vector of ch*n floats is taken from the block-local allocator,
   filled channel by channel at stride ch, and handed to _01forward as a
   single channel using _encodepart. Afterwards the per-channel running
   totals are updated, and a separate visible path fills the stats slots
   with the current bit position. Several loop headers, conditions and the
   return statements are not visible in this excerpt. */
772 int res2_forward(vorbis_block *vb,vorbis_look_residue *vl,
773 float **in,float **out,int *nonzero,int ch,
774 int pass,long **partword,ogg_uint32_t *stats){
775 long i,j,k,n=vb->pcmend/2,used=0;
777 /* don't duplicate the code; use a working vector hack for now and
778 reshape ourselves into a single channel res1 */
779 /* ugly; reallocs for each coupling pass :-( */
780 float *work=_vorbis_block_alloc(vb,ch*n*sizeof(*work));
/* used counts the channels flagged nonzero; k starts at the channel index
   and advances by ch, i.e. sample j of channel i sits at work[j*ch+i]. */
783 if(nonzero[i])used++;
784 for(j=0,k=i;j<n;j++,k+=ch)
789 int ret=_01forward(vb,vl,&work,1,pass,partword,_encodepart,stats);
790 /* update the sofar vector */
794 for(j=0,k=i;j<n;j++,k+=ch)
796 sofar[j]+=pcm[j]; /* when training, our previous stage books
799 sofar[j]+=pcm[j]-work[k];
804 for(i=0;i<vorbis_bitrate_maxmarkers();i++)
805 stats[i]=oggpack_bits(&vb->opb);
811 /* duplicate code here as speed is somewhat more important */
/* Decode entry point for residue type 2.
   Returns 0 immediately when no channel is flagged nonzero. Otherwise, for
   each stage, walks the partitions in groups of partitions_per_word: one
   phrase codeword is decoded and mapped through decodemap to the classes of
   the group, and for every partition whose class has a book for the stage,
   vorbis_book_decodevv_add adds the decoded values across all ch channels
   of in. A -1 from the phrase decode jumps to eopbreak and a NULL decodemap
   row jumps to errout; the code at those labels is not visible here. */
812 int res2_inverse(vorbis_block *vb,vorbis_look_residue *vl,
813 float **in,int *nonzero,int ch){
815 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
816 vorbis_info_residue0 *info=look->info;
818 /* move all this setup out later */
819 int samples_per_partition=info->grouping;
820 int partitions_per_word=look->phrasebook->dim;
821 int n=info->end-info->begin;
823 int partvals=n/samples_per_partition;
/* Number of phrase codewords needed to cover partvals, rounded up. */
824 int partwords=(partvals+partitions_per_word-1)/partitions_per_word;
825 int **partword=_vorbis_block_alloc(vb,partwords*sizeof(*partword));
827 for(i=0;i<ch;i++)if(nonzero[i])break;
828 if(i==ch)return(0); /* no nonzero vectors */
830 for(s=0;s<look->stages;s++){
/* i counts partitions, l counts phrase codewords. */
831 for(i=0,l=0;i<partvals;l++){
834 /* fetch the partition word */
/* NOTE(review): temp is only compared against -1 before indexing
   decodemap; this presumably relies on the phrase book having no more
   entries than look->partvals. Confirm. */
835 int temp=vorbis_book_decode(look->phrasebook,&vb->opb);
836 if(temp==-1)goto eopbreak;
837 partword[l]=look->decodemap[temp];
838 if(partword[l]==NULL)goto errout;
841 /* now we decode residual values for the partitions */
842 for(k=0;k<partitions_per_word && i<partvals;k++,i++)
843 if(info->secondstages[partword[l][k]]&(1<<s)){
844 codebook *stagebook=look->partbooks[partword[l][k]][s];
847 if(vorbis_book_decodevv_add(stagebook,in,
848 i*samples_per_partition+info->begin,ch,
849 &vb->opb,samples_per_partition)==-1)
/* Exported vorbis_func_residue objects, one per residue type (0, 1, 2).
   NOTE(review): the initializer lists are not visible in this excerpt;
   presumably each one lists the pack/unpack/look/copy/free/class/forward/
   inverse routines defined above for its type. */
862 vorbis_func_residue residue0_exportbundle={
874 vorbis_func_residue residue1_exportbundle={
886 vorbis_func_residue residue2_exportbundle={