1 /********************************************************************
3 * THIS FILE IS PART OF THE OggVorbis SOFTWARE CODEC SOURCE CODE. *
4 * USE, DISTRIBUTION AND REPRODUCTION OF THIS LIBRARY SOURCE IS *
5 * GOVERNED BY A BSD-STYLE SOURCE LICENSE INCLUDED WITH THIS SOURCE *
6 * IN 'COPYING'. PLEASE READ THESE TERMS BEFORE DISTRIBUTING. *
8 * THE OggVorbis SOURCE CODE IS (C) COPYRIGHT 1994-2001 *
9 * by the XIPHOPHORUS Company http://www.xiph.org/ *
11 ********************************************************************
13 function: residue backend 0, 1 and 2 implementation
14 last mod: $Id: res0.c,v 1.39 2001/12/16 04:15:47 xiphmont Exp $
16 ********************************************************************/
18 /* Slow, slow, slow, simpleminded and did I mention it was slow? The
19 encode/decode loops are coded for clarity and performance is not
20 yet even a nagging little idea lurking in the shadows. Oh and BTW, it's slow. */
27 #include "vorbis/codec.h"
28 #include "codec_internal.h"
/* Fields of the residue lookup state.  The opening of this struct
   declaration and several other members are not visible in this
   excerpt. */
/* residue settings read by the classify/encode/decode routines */
39 vorbis_info_residue0 *info;
/* codebook pointers indexed partbooks[partition class][stage] */
46 codebook ***partbooks;
/* partition-index thresholds for bit tracking; res0_look fills the first
   BITTRACK_DIVISOR slots and stores a large sentinel in the last one */
55 int qoffsets[BITTRACK_DIVISOR+1];
/* training accumulators indexed training_data[stage][partition class] */
58 long *training_data[8][64];
64 } vorbis_look_residue0;
/* Duplicate a residue info block: allocates a new vorbis_info_residue0
   with _ogg_malloc and fills it with a byte-for-byte memcpy of the
   input.  The return statement and closing brace are on lines not
   visible in this excerpt.
   NOTE(review): no check for a failed allocation is visible before the
   memcpy -- confirm how allocation failure is handled. */
66 vorbis_info_residue *res0_copy_info(vorbis_info_residue *vr){
67 vorbis_info_residue0 *info=(vorbis_info_residue0 *)vr;
68 vorbis_info_residue0 *ret=_ogg_malloc(sizeof(*ret));
69 memcpy(ret,info,sizeof(*ret));
/* Release a residue info block.  The visible code zeroes the whole
   structure with memset; any guard on the argument and the actual free
   call are on lines not visible in this excerpt. */
73 void res0_free_info(vorbis_info_residue *i){
74 vorbis_info_residue0 *info=(vorbis_info_residue0 *)i;
/* scrub the structure contents */
76 memset(info,0,sizeof(*info));
/* Tear down a residue lookup.  The visible code:
     - for each partition/stage slot that has training data, writes one
       "index:count" line per codebook entry to a file named
       res_partN_passM.vqd and frees the accumulator;
     - prints min/max residue and per-frame bit usage to stderr;
     - frees every partbooks[] row, the partbooks table, every
       decodemap[] row and the decodemap table;
     - zeroes the lookup structure.
   Local declarations, any preprocessor guards around the diagnostic
   sections, the file open/close calls and the final release of the
   structure itself are on lines not visible in this excerpt. */
81 void res0_free_look(vorbis_look_residue *i){
85 vorbis_look_residue0 *look=(vorbis_look_residue0 *)i;
/* j walks partition classes; k is the stage index (its loop header is
   not visible here) */
90 for(j=0;j<look->parts;j++){
92 if(look->training_data[k][j]){
95 codebook *statebook=look->partbooks[j][k];
97 /* long and short into the same bucket by current convention */
98 sprintf(buffer,"res_part%d_pass%d.vqd",j,k);
/* one line per codebook entry: entry index and its accumulated count */
101 for(l=0;l<statebook->entries;l++)
102 fprintf(of,"%d:%ld\n",l,look->training_data[k][j][l]);
106 _ogg_free(look->training_data[k][j]);
110 fprintf(stderr,"min/max residue: %g::%g\n",look->tmin,look->tmax);
/* NOTE(review): the three ratios below divide by look->frames --
   confirm it cannot be zero when this runs */
112 fprintf(stderr,"residue bit usage %f:%f (%f total)\n",
113 (float)look->phrasebits/look->frames,
114 (float)look->postbits/look->frames,
115 (float)(look->postbits+look->phrasebits)/look->frames);
/* the block comment that follows is disabled per-partition bit
   statistics code */
119 /*vorbis_info_residue0 *info=look->info;
122 "%ld frames encoded in %ld phrasebits and %ld residue bits "
123 "(%g/frame) \n",look->frames,look->phrasebits,
125 (look->phrasebits+look->resbitsflat)/(float)look->frames);
127 for(j=0;j<look->parts;j++){
129 fprintf(stderr,"\t[%d] == ",j);
130 for(k=0;k<look->stages;k++)
131 if((info->secondstages[j]>>k)&1){
132 fprintf(stderr,"%ld,",look->resbits[j][k]);
133 acc+=look->resbits[j][k];
136 fprintf(stderr,":: (%ld vals) %1.2fbits/sample\n",look->resvals[j],
137 acc?(float)acc/(look->resvals[j]*info->grouping):0);
139 fprintf(stderr,"\n");*/
/* release the per-partition book tables, then the table of tables */
141 for(j=0;j<look->parts;j++)
142 if(look->partbooks[j])_ogg_free(look->partbooks[j]);
143 _ogg_free(look->partbooks);
/* release each decode map row, then the map itself */
144 for(j=0;j<look->partvals;j++)
145 _ogg_free(look->decodemap[j]);
146 _ogg_free(look->decodemap);
/* scrub the structure contents */
148 memset(look,0,sizeof(*look));
/* Integer helper on an unsigned value; the body is not visible in this
   excerpt.
   NOTE(review): res0_look uses the result as the number of stages
   implied by a secondstages bitmask, so this is presumably the bit
   length of v -- confirm against the body. */
153 static int ilog(unsigned int v){
/* Integer helper on an unsigned value; the body is not visible in this
   excerpt.
   NOTE(review): res0_pack and res0_unpack add the result for each
   secondstages mask into a running total before handling booklist
   entries, so this is presumably a count of set bits -- confirm against
   the body. */
162 static int icount(unsigned int v){
/* Serialize a residue configuration into the bitstream header.
   Fields written by the visible code, in order: begin (24 bits), end
   (24 bits), grouping-1 (24 bits), partitions-1 (6 bits), groupbook
   (8 bits), one cascade (secondstages) entry per partition class, then
   8-bit booklist entries.  res0_unpack reads the fields back in the
   same order and widths.  Local declarations, the else keyword and the
   booklist loop header are on lines not visible in this excerpt. */
172 void res0_pack(vorbis_info_residue *vr,oggpack_buffer *opb){
173 vorbis_info_residue0 *info=(vorbis_info_residue0 *)vr;
/* start and end of the coded range */
175 oggpack_write(opb,info->begin,24);
176 oggpack_write(opb,info->end,24);
178 oggpack_write(opb,info->grouping-1,24); /* residue vectors to group and
179 code with a partitioned book */
180 oggpack_write(opb,info->partitions-1,6); /* possible partition choices */
181 oggpack_write(opb,info->groupbook,8); /* group huffman book */
183 /* secondstages is a bitmask; as encoding progresses pass by pass, a
184 bitmask of one indicates this partition class has bits to write
186 for(j=0;j<info->partitions;j++){
187 if(ilog(info->secondstages[j])>3){
188 /* yes, this is a minor hack due to not thinking ahead */
/* long form: low 3 bits, a set flag bit, then the next 5 bits */
189 oggpack_write(opb,info->secondstages[j],3);
190 oggpack_write(opb,1,1);
191 oggpack_write(opb,info->secondstages[j]>>3,5);
/* short form (presumably the else branch): a single 4-bit write; the
   reader takes the fourth bit as the flag */
193 oggpack_write(opb,info->secondstages[j],4); /* trailing zero */
194 acc+=icount(info->secondstages[j]);
/* booklist entries, 8 bits each */
197 oggpack_write(opb,info->booklist[j],8);
/* Parse a residue configuration from the bitstream header into a newly
   zero-allocated vorbis_info_residue0.  Reads the same fields, in the
   same order and widths, that res0_pack writes.  groupbook and each
   booklist entry are checked against ci->books; a failed check jumps to
   errout, where the visible code calls res0_free_info.  The return
   statements, the booklist loop header and the errout label itself are
   on lines not visible in this excerpt.
   NOTE(review): no check of the accumulated book count against the
   capacity of info->booklist is visible here -- confirm one exists. */
201 /* vorbis_info is for range checking */
202 vorbis_info_residue *res0_unpack(vorbis_info *vi,oggpack_buffer *opb){
204 vorbis_info_residue0 *info=_ogg_calloc(1,sizeof(*info));
205 codec_setup_info *ci=vi->codec_setup;
/* grouping and partitions are stored minus one in the stream */
207 info->begin=oggpack_read(opb,24);
208 info->end=oggpack_read(opb,24);
209 info->grouping=oggpack_read(opb,24)+1;
210 info->partitions=oggpack_read(opb,6)+1;
211 info->groupbook=oggpack_read(opb,8);
/* per partition class: 3 low cascade bits, a flag bit, and when the
   flag is set 5 more bits placed above the first three */
213 for(j=0;j<info->partitions;j++){
214 int cascade=oggpack_read(opb,3);
215 if(oggpack_read(opb,1))
216 cascade|=(oggpack_read(opb,5)<<3);
217 info->secondstages[j]=cascade;
219 acc+=icount(cascade);
/* booklist entries, 8 bits each */
222 info->booklist[j]=oggpack_read(opb,8);
/* every referenced codebook index must be below ci->books */
224 if(info->groupbook>=ci->books)goto errout;
226 if(info->booklist[j]>=ci->books)goto errout;
/* failure path: dispose of the partially filled info */
230 res0_free_info(info);
/* Build the residue lookup state from a residue info block.
   The visible code:
     - allocates a zeroed vorbis_look_residue0;
     - records the mapping number, partition count, the backend's
       fullbooks array and the phrasebook (fullbooks+groupbook);
     - for each partition class, allocates a row of ilog(secondstages)
       book pointers and fills the slots whose stage bit is set from
       consecutive booklist entries;
     - sets partvals to parts raised to the phrasebook dimension and
       allocates decodemap with partvals rows of dim entries each;
     - fills qoffsets with evenly spaced partition thresholds plus a
       large sentinel.
   Local declarations, the inner decodemap loop, preprocessor guards and
   the return statement are on lines not visible in this excerpt. */
234 vorbis_look_residue *res0_look(vorbis_dsp_state *vd,vorbis_info_mode *vm,
235 vorbis_info_residue *vr){
236 vorbis_info_residue0 *info=(vorbis_info_residue0 *)vr;
237 vorbis_look_residue0 *look=_ogg_calloc(1,sizeof(*look));
238 backend_lookup_state *be=vd->backend_state;
244 look->map=vm->mapping;
246 look->parts=info->partitions;
247 look->fullbooks=be->fullbooks;
248 look->phrasebook=be->fullbooks+info->groupbook;
/* the phrasebook dimension is the number of partitions per codeword */
249 dim=look->phrasebook->dim;
251 look->partbooks=_ogg_calloc(look->parts,sizeof(*look->partbooks));
253 for(j=0;j<look->parts;j++){
254 int stages=ilog(info->secondstages[j]);
/* remember the deepest cascade across all partition classes */
256 if(stages>maxstage)maxstage=stages;
257 look->partbooks[j]=_ogg_calloc(stages,sizeof(*look->partbooks[j]));
258 for(k=0;k<stages;k++)
259 if(info->secondstages[j]&(1<<k)){
/* books are consumed from booklist in order, one per set stage bit */
260 look->partbooks[j][k]=be->fullbooks+info->booklist[acc++];
/* NOTE(review): this accumulator comes from plain calloc but
   res0_free_look releases it with _ogg_free -- confirm the two are
   compatible */
262 look->training_data[k][j]=calloc(look->partbooks[j][k]->entries,
263 sizeof(***look->training_data));
/* number of distinct phrasebook words: parts to the power dim */
269 look->partvals=rint(pow(look->parts,dim));
270 look->stages=maxstage;
271 look->decodemap=_ogg_malloc(look->partvals*sizeof(*look->decodemap));
272 for(j=0;j<look->partvals;j++){
274 long mult=look->partvals/look->parts;
275 look->decodemap[j]=_ogg_malloc(dim*sizeof(*look->decodemap[j]));
/* deco is computed on lines not visible here */
280 look->decodemap[j][k]=deco;
285 int samples_per_partition=info->grouping;
286 int n=info->end-info->begin,i;
287 int partvals=n/samples_per_partition;
/* evenly spaced partition-index thresholds for bit tracking */
289 for(i=0;i<BITTRACK_DIVISOR;i++)
290 look->qoffsets[i]=partvals*(i+1)/BITTRACK_DIVISOR;
/* sentinel in the slot after the loop's last index */
292 look->qoffsets[i]=9999999;
/* Partition classifier (interleaved variant).  The visible code takes
   absolute values of the input into temp, tracks a running maximum,
   rounds temp with rint, and then scans the first auxparts-1 classes
   for one whose blimit, entmax and ampmax limits all admit this
   partition.  The entropy computation, the action taken on a match and
   the return value are on lines not visible in this excerpt. */
299 /* does not guard against invalid settings; eg, a subn of 16 and a
300 subgroup request of 32. Max subn of 128 */
301 static int _interleaved_testhack(float *vec,int n,vorbis_look_residue0 *look,
302 int auxparts,int auxpartnum){
303 vorbis_info_residue0 *info=look->info;
305 float max,localmax=0.f;
/* work on magnitudes */
310 for(i=0;i<n;i++)temp[i]=fabs(vec[i]);
312 /* handle case subgrp==1 outside */
314 if(temp[i]>localmax)localmax=temp[i];
/* round magnitudes to the nearest integer value */
317 for(i=0;i<n;i++)temp[i]=rint(temp[i]);
330 if(temp[i]>localmax)localmax=temp[i];
/* a class matches when the partition number, the entropy for the
   class's subgroup size and the peak are all within its limits */
333 for(i=0;i<auxparts-1;i++)
334 if(auxpartnum<info->blimit[i] &&
335 entropy[info->subgrp[i]]<=info->entmax[i] &&
336 max<=info->ampmax[i])
/* Partition classifier.  The visible code takes absolute values of the
   input into temp, records the largest as max, rounds temp with rint,
   and scans the first auxparts-1 classes for one whose blimit, entmax
   and ampmax limits all admit this partition.  The entropy computation,
   the action taken on a match and the return value are on lines not
   visible in this excerpt. */
342 static int _testhack(float *vec,int n,vorbis_look_residue0 *look,
343 int auxparts,int auxpartnum){
344 vorbis_info_residue0 *info=look->info;
/* work on magnitudes */
351 for(i=0;i<n;i++)temp[i]=fabs(vec[i]);
354 if(temp[i]>max)max=temp[i];
/* round magnitudes to the nearest integer value */
356 for(i=0;i<n;i++)temp[i]=rint(temp[i]);
/* a class matches when the partition number, the entropy and the peak
   are all within its limits */
361 for(i=0;i<auxparts-1;i++)
362 if(auxpartnum<info->blimit[i] &&
363 entropy<=info->entmax[i] &&
364 max<=info->ampmax[i])
/* Encode one partition with an interleaved sample layout.  The visible
   code picks the best codebook entry for the vector starting at vec+i
   with stride step, writes it to opb and adds the bit count returned by
   vorbis_book_encode to bits.  The remaining parameter, the loop header
   and the return are on lines not visible in this excerpt. */
370 static int _interleaved_encodepart(oggpack_buffer *opb,float *vec, int n,
371 codebook *book,vorbis_look_residue0 *look,
378 int entry=vorbis_book_besterror(book,vec+i,step,0);
384 bits+=vorbis_book_encode(book,entry,opb);
/* Encode one partition with a contiguous sample layout.  The visible
   code picks the best codebook entry for the vector starting at
   vec+i*dim with stride 1, writes it to opb and adds the bit count
   returned by vorbis_book_encode to bits.  The remaining parameter, the
   loop header and the return are on lines not visible in this
   excerpt. */
390 static int _encodepart(oggpack_buffer *opb,float *vec, int n,
391 codebook *book,vorbis_look_residue0 *look,
398 int entry=vorbis_book_besterror(book,vec+i*dim,1,0);
404 bits+=vorbis_book_encode(book,entry,opb);
/* Classify every partition of every channel (shared by residue types 0
   and 1).  Allocates partword as ch rows from the block allocator, each
   row holding one zero-initialised entry per partition, then calls the
   supplied classify routine on each partition's samples, starting at
   in[j]+i*samples_per_partition+info->begin.  A diagnostic section
   appends the chosen classes to resaux_long.vqd or resaux_short.vqd.
   Several parameters, the channel loop headers, the store of the
   classify result, preprocessor guards and the return are on lines not
   visible in this excerpt. */
410 static long **_01class(vorbis_block *vb,vorbis_look_residue *vl,
412 int (*classify)(float *,int,vorbis_look_residue0 *,
415 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
416 vorbis_info_residue0 *info=look->info;
418 /* move all this setup out later */
419 int samples_per_partition=info->grouping;
420 int possible_partitions=info->partitions;
421 int n=info->end-info->begin;
/* number of whole partitions in the coded range */
423 int partvals=n/samples_per_partition;
424 long **partword=_vorbis_block_alloc(vb,ch*sizeof(*partword));
426 /* we find the partition type for each partition of each
427 channel. We'll go back and do the interleaved encoding in a
428 bit. For now, clarity */
431 partword[i]=_vorbis_block_alloc(vb,n/samples_per_partition*sizeof(*partword[i]));
432 memset(partword[i],0,n/samples_per_partition*sizeof(*partword[i]));
435 for(i=0;i<partvals;i++){
437 /* do the partition decision based on the 'entropy'
440 classify(in[j]+i*samples_per_partition+info->begin,
441 samples_per_partition,look,possible_partitions,i);
452 sprintf(buffer,"resaux_%s.vqd",(vb->mode?"long":"short"));
453 of=fopen(buffer,"a");
454 for(j=0;j<partvals;j++)
455 fprintf(of,"%ld, ",partword[i][j]);
/* Classify partitions for residue type 2.  Allocates a single partword
   row (partword[0]) of n*ch/samples_per_partition zero-initialised
   entries and a stack work buffer of samples_per_partition floats, then
   calls the supplied classify routine on the work buffer once per
   partition.  A diagnostic section appends the chosen classes to
   resaux_long.vqd or resaux_short.vqd.  The code that fills the work
   buffer, the store of the classify result, preprocessor guards and the
   return are on lines not visible in this excerpt. */
466 static long **_2class(vorbis_block *vb,vorbis_look_residue *vl,
468 int (*classify)(float *,int,vorbis_look_residue0 *,
471 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
472 vorbis_info_residue0 *info=look->info;
474 /* move all this setup out later */
475 int samples_per_partition=info->grouping;
476 int possible_partitions=info->partitions;
477 int n=info->end-info->begin;
/* number of whole partitions in the coded range */
479 int partvals=n/samples_per_partition;
480 long **partword=_vorbis_block_alloc(vb,sizeof(*partword));
/* scratch for one partition's worth of samples */
481 float *work=alloca(sizeof(*work)*samples_per_partition);
488 partword[0]=_vorbis_block_alloc(vb,n*ch/samples_per_partition*sizeof(*partword[0]));
489 memset(partword[0],0,n*ch/samples_per_partition*sizeof(*partword[0]));
/* l starts at the beginning of the coded range; how j and l advance is
   not visible here */
491 for(i=0,j=0,k=0,l=info->begin;i<partvals;i++){
492 for(k=0;k<samples_per_partition;k++){
502 classify(work,samples_per_partition,look,possible_partitions,i);
/* NOTE(review): the fopen result is used without a visible NULL check */
509 sprintf(buffer,"resaux_%s.vqd",(vb->mode?"long":"short"));
510 of=fopen(buffer,"a");
511 for(i=0;i<partvals;i++)
512 fprintf(of,"%ld, ",partword[0][i]);
/* Shared encoder for residue types 0 and 1; callers pass the per-type
   encode routine.  For each stage s in this pass's range (bounded by
   ci->passlimit), walks the partitions: combines partitions_per_word
   class numbers from partword into one phrasebook value and encodes it,
   then encodes each of those partitions with the stage-s book of its
   class when that class has the stage bit set in secondstages.
   When stats is non-NULL, the current bit position is sampled into it
   each time the partition index reaches a qoffsets threshold.
   The visible code also tracks min/max input values and per-class
   bit/sample counts for diagnostics.  Several parameters, local
   declarations, the channel loop headers, preprocessor guards and the
   return are on lines not visible in this excerpt. */
522 static int _01forward(vorbis_block *vb,vorbis_look_residue *vl,
524 int pass,long **partword,
525 int (*encode)(oggpack_buffer *,float *,int,
526 codebook *,vorbis_look_residue0 *,long *),
527 ogg_uint32_t *stats){
529 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
530 vorbis_info_residue0 *info=look->info;
532 vorbis_dsp_state *vd=vb->vd;
533 vorbis_info *vi=vd->vi;
534 codec_setup_info *ci=vi->codec_setup;
537 /* move all this setup out later */
538 int samples_per_partition=info->grouping;
539 int possible_partitions=info->partitions;
540 int partitions_per_word=look->phrasebook->dim;
541 int n=info->end-info->begin;
/* number of whole partitions in the coded range */
543 int partvals=n/samples_per_partition;
/* diagnostic: track the extreme input values seen */
549 for(j=info->begin;j<info->end;j++){
550 if(in[i][j]>look->tmax)look->tmax=in[i][j];
551 if(in[i][j]<look->tmin)look->tmin=in[i][j];
555 memset(resbits,0,sizeof(resbits));
556 memset(resvals,0,sizeof(resvals));
558 /* we code the partition words for each channel, then the residual
559 words for a partition per channel until we've written all the
560 residual words for that partition word. Then write the next
561 partition channel words... */
/* stages covered by this pass: from the previous pass's limit (or 0)
   up to this pass's limit */
563 for(s=(pass==0?0:ci->passlimit[pass-1]);s<ci->passlimit[pass];s++){
565 ogg_uint32_t *qptr=NULL;
/* each stage gets its own run of BITTRACK_DIVISOR stat slots */
566 if(stats)qptr=stats+s*BITTRACK_DIVISOR;
/* i is advanced by the inner partition loop, not here */
568 for(i=0;i<partvals;){
570 /* first we encode a partition codeword for each channel */
573 long val=partword[j][i];
/* fold the following class numbers into val, base possible_partitions */
575 for(k=1;k<partitions_per_word;k++){
576 val*=possible_partitions;
578 val+=partword[j][i+k];
/* only values that are valid phrasebook entries are encoded */
582 if(val<look->phrasebook->entries)
583 ret=vorbis_book_encode(look->phrasebook,val,&vb->opb);
588 look->phrasebits+=ret;
593 /* now we encode interleaved residual values for the partitions */
594 for(k=0;k<partitions_per_word && i<partvals;k++,i++){
595 long offset=i*samples_per_partition+info->begin;
/* record the bit position for every threshold reached so far */
597 if(qptr)while(i>=look->qoffsets[bin])
598 qptr[bin++]=oggpack_bits(&vb->opb);
601 if(s==0)resvals[partword[j][i]]+=samples_per_partition;
/* skip classes that have no book for this stage */
602 if(info->secondstages[partword[j][i]]&(1<<s)){
603 codebook *statebook=look->partbooks[partword[j][i]][s];
607 long *accumulator=NULL;
610 accumulator=look->training_data[s][partword[j][i]];
613 ret=encode(&vb->opb,in[j]+offset,samples_per_partition,
614 statebook,look,accumulator);
617 resbits[partword[j][i]]+=ret;
/* fill any remaining stat slots whose threshold has been reached */
622 if(qptr)while(i>=look->qoffsets[bin])
623 qptr[bin++]=oggpack_bits(&vb->opb);
/* diagnostic dump of per-class sample counts and bits per sample */
630 fprintf(stderr,"%d :: ",vb->mode);
631 for(k=0;k<possible_partitions;k++){
632 fprintf(stderr,"%ld/%1.2g, ",resvals[k],(float)resbits[k]/resvals[k]);
634 totalbits+=resbits[k];
637 fprintf(stderr,":: %ld:%1.2g\n",total,(double)totalbits/total);
/* Shared decoder for residue types 0 and 1; decodepart is the per-type
   codebook decode routine.  For each stage, reads one phrasebook
   codeword per channel, maps it through look->decodemap to a list of
   partition classes, then decodes each partition whose class has the
   stage bit set in secondstages.  A -1 from either decode call jumps to
   eopbreak; a NULL decodemap entry jumps to errout.  Both labels, the
   channel loop headers, some parameters and the return are on lines not
   visible in this excerpt.
   NOTE(review): temp indexes decodemap with no visible range check
   other than the -1 test -- confirm the phrasebook cannot yield an
   index at or beyond partvals. */
642 /* a truncated packet here just means 'stop working'; it's not an error */
643 static int _01inverse(vorbis_block *vb,vorbis_look_residue *vl,
645 long (*decodepart)(codebook *, float *,
646 oggpack_buffer *,int)){
649 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
650 vorbis_info_residue0 *info=look->info;
652 /* move all this setup out later */
653 int samples_per_partition=info->grouping;
654 int partitions_per_word=look->phrasebook->dim;
655 int n=info->end-info->begin;
657 int partvals=n/samples_per_partition;
/* number of phrasebook words needed to cover partvals, rounded up */
658 int partwords=(partvals+partitions_per_word-1)/partitions_per_word;
659 int ***partword=alloca(ch*sizeof(*partword));
662 partword[j]=_vorbis_block_alloc(vb,partwords*sizeof(*partword[j]));
664 for(s=0;s<look->stages;s++){
666 /* each loop decodes one partition codeword containing
667 partitions_per_word partitions */
/* l counts codewords; i counts partitions and is advanced by the
   inner loop */
668 for(i=0,l=0;i<partvals;l++){
670 /* fetch the partition word for each channel */
672 int temp=vorbis_book_decode(look->phrasebook,&vb->opb);
673 if(temp==-1)goto eopbreak;
674 partword[j][l]=look->decodemap[temp];
675 if(partword[j][l]==NULL)goto errout;
679 /* now we decode residual values for the partitions */
680 for(k=0;k<partitions_per_word && i<partvals;k++,i++)
682 long offset=info->begin+i*samples_per_partition;
/* skip classes that have no book for this stage */
683 if(info->secondstages[partword[j][l][k]]&(1<<s)){
684 codebook *stagebook=look->partbooks[partword[j][l][k]][s];
686 if(decodepart(stagebook,in[j]+offset,&vb->opb,
687 samples_per_partition)==-1)goto eopbreak;
/* Residue 0 classification entry point: forwards to _01class with the
   _testhack classifier and a channel count named used.  The code that
   computes used is on lines not visible in this excerpt. */
699 /* residue 0 and 1 are just slight variants of one another. 0 is
700 interleaved, 1 is not */
701 long **res0_class(vorbis_block *vb,vorbis_look_residue *vl,
702 float **in,int *nonzero,int ch){
703 /* we encode only the nonzero parts of a bundle */
/* the interleaved classifier call is kept below, commented out */
709 /*return(_01class(vb,vl,in,used,_interleaved_testhack));*/
710 return(_01class(vb,vl,in,used,_testhack));
/* Residue 0 encode entry point.  Calls _01forward with the interleaved
   partition encoder, subtracts the in[] data from out[] afterwards, and
   in a separate visible statement stores the current bit position in
   every stats slot up to vorbis_bitrate_maxmarkers().  The code that
   selects channels, the surrounding loops and conditions, and the
   returns are on lines not visible in this excerpt. */
715 int res0_forward(vorbis_block *vb,vorbis_look_residue *vl,
716 float **in,float **out,int *nonzero,int ch,
717 int pass, long **partword,ogg_uint32_t *stats){
718 /* we encode only the nonzero parts of a bundle */
719 int i,j,used=0,n=vb->pcmend/2;
727 int ret=_01forward(vb,vl,in,used,pass,partword,
728 _interleaved_encodepart,stats);
/* update out[] by the values in the packed in[] channel */
733 out[i][j]-=in[used][j];
/* fill every marker with the current bit position */
738 for(i=0;i<vorbis_bitrate_maxmarkers();i++)
739 stats[i]=oggpack_bits(&vb->opb);
/* Residue 0 decode entry point: forwards to _01inverse with
   vorbis_book_decodevs_add as the partition decoder.  The code that
   computes used is on lines not visible in this excerpt. */
745 int res0_inverse(vorbis_block *vb,vorbis_look_residue *vl,
746 float **in,int *nonzero,int ch){
752 return(_01inverse(vb,vl,in,used,vorbis_book_decodevs_add));
/* Residue 1 encode entry point.  Calls _01forward with the
   non-interleaved partition encoder, subtracts the in[] data from out[]
   afterwards, and in a separate visible statement stores the current
   bit position in every stats slot up to vorbis_bitrate_maxmarkers().
   The code that selects channels, the surrounding loops and conditions,
   and the returns are on lines not visible in this excerpt. */
757 int res1_forward(vorbis_block *vb,vorbis_look_residue *vl,
758 float **in,float **out,int *nonzero,int ch,
759 int pass, long **partword, ogg_uint32_t *stats){
760 int i,j,used=0,n=vb->pcmend/2;
769 int ret=_01forward(vb,vl,in,used,pass,partword,_encodepart,stats);
/* update out[] by the values in the packed in[] channel */
774 out[i][j]-=in[used][j];
/* fill every marker with the current bit position */
779 for(i=0;i<vorbis_bitrate_maxmarkers();i++)
780 stats[i]=oggpack_bits(&vb->opb);
/* Residue 1 classification entry point: forwards to _01class with the
   _testhack classifier.  The code that computes used is on lines not
   visible in this excerpt. */
786 long **res1_class(vorbis_block *vb,vorbis_look_residue *vl,
787 float **in,int *nonzero,int ch){
793 return(_01class(vb,vl,in,used,_testhack));
/* Residue 1 decode entry point: forwards to _01inverse with
   vorbis_book_decodev_add as the partition decoder.  The code that
   computes used is on lines not visible in this excerpt. */
798 int res1_inverse(vorbis_block *vb,vorbis_look_residue *vl,
799 float **in,int *nonzero,int ch){
805 return(_01inverse(vb,vl,in,used,vorbis_book_decodev_add));
/* Residue 2 classification entry point: forwards to _2class with the
   _testhack classifier.  The code that computes used is on lines not
   visible in this excerpt. */
810 long **res2_class(vorbis_block *vb,vorbis_look_residue *vl,
811 float **in,int *nonzero,int ch){
817 return(_2class(vb,vl,in,used,_testhack));
/* Residue 2 encode entry point.  Allocates a work vector of ch*n floats
   from the block allocator, counts channels flagged nonzero, walks the
   work vector with stride ch per channel, and encodes it through
   _01forward as a single channel using the non-interleaved partition
   encoder.  Afterwards it folds pcm[j]-work[k] into sofar[j], and in a
   separate visible statement stores the current bit position in every
   stats slot up to vorbis_bitrate_maxmarkers().  The statements that
   fill work, the definitions of pcm and sofar, the surrounding loops
   and conditions, and the returns are on lines not visible in this
   excerpt. */
822 /* res2 is slightly more different; all the channels are interleaved
823 into a single vector and encoded. */
825 int res2_forward(vorbis_block *vb,vorbis_look_residue *vl,
826 float **in,float **out,int *nonzero,int ch,
827 int pass,long **partword,ogg_uint32_t *stats){
828 long i,j,k,n=vb->pcmend/2,used=0;
830 /* don't duplicate the code; use a working vector hack for now and
831 reshape ourselves into a single channel res1 */
832 /* ugly; reallocs for each coupling pass :-( */
833 float *work=_vorbis_block_alloc(vb,ch*n*sizeof(*work));
836 if(nonzero[i])used++;
/* channel i occupies work[i], work[i+ch], work[i+2*ch], ... */
837 for(j=0,k=i;j<n;j++,k+=ch)
/* the whole interleaved vector is coded as one channel */
842 int ret=_01forward(vb,vl,&work,1,pass,partword,_encodepart,stats);
843 /* update the sofar vector */
847 for(j=0,k=i;j<n;j++,k+=ch)
848 sofar[j]+=pcm[j]-work[k];
/* fill every marker with the current bit position */
853 for(i=0;i<vorbis_bitrate_maxmarkers();i++)
854 stats[i]=oggpack_bits(&vb->opb);
/* Residue 2 decode entry point.  Returns 0 immediately when no channel
   is flagged nonzero.  Otherwise, for each stage, reads one phrasebook
   codeword, maps it through look->decodemap to a list of partition
   classes, and decodes each partition whose class has the stage bit set
   using vorbis_book_decodevv_add across all ch channels.  A -1 from the
   phrasebook decode jumps to eopbreak and a NULL decodemap entry jumps
   to errout.  Both labels, the action taken when the partition decode
   returns -1, local declarations and the final return are on lines not
   visible in this excerpt.
   NOTE(review): temp indexes decodemap with no visible range check
   other than the -1 test -- confirm the phrasebook cannot yield an
   index at or beyond partvals. */
860 /* duplicate code here as speed is somewhat more important */
861 int res2_inverse(vorbis_block *vb,vorbis_look_residue *vl,
862 float **in,int *nonzero,int ch){
864 vorbis_look_residue0 *look=(vorbis_look_residue0 *)vl;
865 vorbis_info_residue0 *info=look->info;
867 /* move all this setup out later */
868 int samples_per_partition=info->grouping;
869 int partitions_per_word=look->phrasebook->dim;
870 int n=info->end-info->begin;
872 int partvals=n/samples_per_partition;
/* number of phrasebook words needed to cover partvals, rounded up */
873 int partwords=(partvals+partitions_per_word-1)/partitions_per_word;
874 int **partword=_vorbis_block_alloc(vb,partwords*sizeof(*partword));
/* find the first channel flagged nonzero, if any */
876 for(i=0;i<ch;i++)if(nonzero[i])break;
877 if(i==ch)return(0); /* no nonzero vectors */
879 for(s=0;s<look->stages;s++){
/* l counts codewords; i counts partitions and is advanced by the
   inner loop */
880 for(i=0,l=0;i<partvals;l++){
883 /* fetch the partition word */
884 int temp=vorbis_book_decode(look->phrasebook,&vb->opb);
885 if(temp==-1)goto eopbreak;
886 partword[l]=look->decodemap[temp];
887 if(partword[l]==NULL)goto errout;
890 /* now we decode residual values for the partitions */
891 for(k=0;k<partitions_per_word && i<partvals;k++,i++)
/* skip classes that have no book for this stage */
892 if(info->secondstages[partword[l][k]]&(1<<s)){
893 codebook *stagebook=look->partbooks[partword[l][k]][s];
896 if(vorbis_book_decodevv_add(stagebook,in,
897 i*samples_per_partition+info->begin,ch,
898 &vb->opb,samples_per_partition)==-1)
/* Exported vorbis_func_residue table named for residue backend 0; the
   initializer entries are not visible in this excerpt. */
911 vorbis_func_residue residue0_exportbundle={
/* Exported vorbis_func_residue table named for residue backend 1; the
   initializer entries are not visible in this excerpt. */
923 vorbis_func_residue residue1_exportbundle={
/* Exported vorbis_func_residue table named for residue backend 2; the
   initializer entries are not visible in this excerpt. */
935 vorbis_func_residue residue2_exportbundle={