src/libFLAC/stream_decoder.c : Fix buffer read overflow.
[platform/upstream/flac.git] / src / libFLAC / lpc.c
1 /* libFLAC - Free Lossless Audio Codec library
2  * Copyright (C) 2000-2009  Josh Coalson
3  * Copyright (C) 2011-2013  Xiph.Org Foundation
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  *
9  * - Redistributions of source code must retain the above copyright
10  * notice, this list of conditions and the following disclaimer.
11  *
12  * - Redistributions in binary form must reproduce the above copyright
13  * notice, this list of conditions and the following disclaimer in the
14  * documentation and/or other materials provided with the distribution.
15  *
16  * - Neither the name of the Xiph.org Foundation nor the names of its
17  * contributors may be used to endorse or promote products derived from
18  * this software without specific prior written permission.
19  *
20  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
21  * ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
22  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
23  * A PARTICULAR PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL THE FOUNDATION OR
24  * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
25  * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
26  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
27  * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
28  * LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
29  * NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
30  * SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
31  */
32
33 #if HAVE_CONFIG_H
34 #  include <config.h>
35 #endif
36
37 #include <math.h>
38
39 #include "FLAC/assert.h"
40 #include "FLAC/format.h"
41 #include "share/compat.h"
42 #include "private/bitmath.h"
43 #include "private/lpc.h"
44 #include "private/macros.h"
45 #if defined DEBUG || defined FLAC__OVERFLOW_DETECT || defined FLAC__OVERFLOW_DETECT_VERBOSE
46 #include <stdio.h>
47 #endif
48
49 /* OPT: #undef'ing this may improve the speed on some architectures */
50 #define FLAC__LPC_UNROLLED_FILTER_LOOPS
51
52 #ifndef FLAC__INTEGER_ONLY_LIBRARY
53
54 #ifndef M_LN2
55 /* math.h in VC++ doesn't seem to have this (how Microsoft is that?) */
56 #define M_LN2 0.69314718055994530942
57 #endif
58
59 #if !defined(HAVE_LROUND)
60 #if defined(_MSC_VER)
61 #include <float.h>
62 #define copysign _copysign
63 #elif defined(__GNUC__)
64 #define copysign __builtin_copysign
65 #endif
66 static inline long int lround(double x) {
67     return (long)(x + copysign (0.5, x));
68 }
69 //If this fails, we are in the precence of a mid 90's compiler..move along...
70 #endif
71
72 void FLAC__lpc_window_data(const FLAC__int32 in[], const FLAC__real window[], FLAC__real out[], unsigned data_len)
73 {
74         unsigned i;
75         for(i = 0; i < data_len; i++)
76                 out[i] = in[i] * window[i];
77 }
78
79 void FLAC__lpc_compute_autocorrelation(const FLAC__real data[], unsigned data_len, unsigned lag, FLAC__real autoc[])
80 {
81         /* a readable, but slower, version */
82 #if 0
83         FLAC__real d;
84         unsigned i;
85
86         FLAC__ASSERT(lag > 0);
87         FLAC__ASSERT(lag <= data_len);
88
89         /*
90          * Technically we should subtract the mean first like so:
91          *   for(i = 0; i < data_len; i++)
92          *     data[i] -= mean;
93          * but it appears not to make enough of a difference to matter, and
94          * most signals are already closely centered around zero
95          */
96         while(lag--) {
97                 for(i = lag, d = 0.0; i < data_len; i++)
98                         d += data[i] * data[i - lag];
99                 autoc[lag] = d;
100         }
101 #endif
102
103         /*
104          * this version tends to run faster because of better data locality
105          * ('data_len' is usually much larger than 'lag')
106          */
107         FLAC__real d;
108         unsigned sample, coeff;
109         const unsigned limit = data_len - lag;
110
111         FLAC__ASSERT(lag > 0);
112         FLAC__ASSERT(lag <= data_len);
113
114         for(coeff = 0; coeff < lag; coeff++)
115                 autoc[coeff] = 0.0;
116         for(sample = 0; sample <= limit; sample++) {
117                 d = data[sample];
118                 for(coeff = 0; coeff < lag; coeff++)
119                         autoc[coeff] += d * data[sample+coeff];
120         }
121         for(; sample < data_len; sample++) {
122                 d = data[sample];
123                 for(coeff = 0; coeff < data_len - sample; coeff++)
124                         autoc[coeff] += d * data[sample+coeff];
125         }
126 }
127
128 void FLAC__lpc_compute_lp_coefficients(const FLAC__real autoc[], unsigned *max_order, FLAC__real lp_coeff[][FLAC__MAX_LPC_ORDER], FLAC__double error[])
129 {
130         unsigned i, j;
131         FLAC__double r, err, lpc[FLAC__MAX_LPC_ORDER];
132
133         FLAC__ASSERT(0 != max_order);
134         FLAC__ASSERT(0 < *max_order);
135         FLAC__ASSERT(*max_order <= FLAC__MAX_LPC_ORDER);
136         FLAC__ASSERT(autoc[0] != 0.0);
137
138         err = autoc[0];
139
140         for(i = 0; i < *max_order; i++) {
141                 /* Sum up this iteration's reflection coefficient. */
142                 r = -autoc[i+1];
143                 for(j = 0; j < i; j++)
144                         r -= lpc[j] * autoc[i-j];
145                 r /= err;
146
147                 /* Update LPC coefficients and total error. */
148                 lpc[i]=r;
149                 for(j = 0; j < (i>>1); j++) {
150                         FLAC__double tmp = lpc[j];
151                         lpc[j] += r * lpc[i-1-j];
152                         lpc[i-1-j] += r * tmp;
153                 }
154                 if(i & 1)
155                         lpc[j] += lpc[j] * r;
156
157                 err *= (1.0 - r * r);
158
159                 /* save this order */
160                 for(j = 0; j <= i; j++)
161                         lp_coeff[i][j] = (FLAC__real)(-lpc[j]); /* negate FIR filter coeff to get predictor coeff */
162                 error[i] = err;
163
164                 /* see SF bug #1601812 http://sourceforge.net/tracker/index.php?func=detail&aid=1601812&group_id=13478&atid=113478 */
165                 if(err == 0.0) {
166                         *max_order = i+1;
167                         return;
168                 }
169         }
170 }
171
172 int FLAC__lpc_quantize_coefficients(const FLAC__real lp_coeff[], unsigned order, unsigned precision, FLAC__int32 qlp_coeff[], int *shift)
173 {
174         unsigned i;
175         FLAC__double cmax;
176         FLAC__int32 qmax, qmin;
177
178         FLAC__ASSERT(precision > 0);
179         FLAC__ASSERT(precision >= FLAC__MIN_QLP_COEFF_PRECISION);
180
181         /* drop one bit for the sign; from here on out we consider only |lp_coeff[i]| */
182         precision--;
183         qmax = 1 << precision;
184         qmin = -qmax;
185         qmax--;
186
187         /* calc cmax = max( |lp_coeff[i]| ) */
188         cmax = 0.0;
189         for(i = 0; i < order; i++) {
190                 const FLAC__double d = fabs(lp_coeff[i]);
191                 if(d > cmax)
192                         cmax = d;
193         }
194
195         if(cmax <= 0.0) {
196                 /* => coefficients are all 0, which means our constant-detect didn't work */
197                 return 2;
198         }
199         else {
200                 const int max_shiftlimit = (1 << (FLAC__SUBFRAME_LPC_QLP_SHIFT_LEN-1)) - 1;
201                 const int min_shiftlimit = -max_shiftlimit - 1;
202                 int log2cmax;
203
204                 (void)frexp(cmax, &log2cmax);
205                 log2cmax--;
206                 *shift = (int)precision - log2cmax - 1;
207
208                 if(*shift > max_shiftlimit)
209                         *shift = max_shiftlimit;
210                 else if(*shift < min_shiftlimit)
211                         return 1;
212         }
213
214         if(*shift >= 0) {
215                 FLAC__double error = 0.0;
216                 FLAC__int32 q;
217                 for(i = 0; i < order; i++) {
218                         error += lp_coeff[i] * (1 << *shift);
219                         q = lround(error);
220
221 #ifdef FLAC__OVERFLOW_DETECT
222                         if(q > qmax+1) /* we expect q==qmax+1 occasionally due to rounding */
223                                 fprintf(stderr,"FLAC__lpc_quantize_coefficients: quantizer overflow: q>qmax %d>%d shift=%d cmax=%f precision=%u lpc[%u]=%f\n",q,qmax,*shift,cmax,precision+1,i,lp_coeff[i]);
224                         else if(q < qmin)
225                                 fprintf(stderr,"FLAC__lpc_quantize_coefficients: quantizer overflow: q<qmin %d<%d shift=%d cmax=%f precision=%u lpc[%u]=%f\n",q,qmin,*shift,cmax,precision+1,i,lp_coeff[i]);
226 #endif
227                         if(q > qmax)
228                                 q = qmax;
229                         else if(q < qmin)
230                                 q = qmin;
231                         error -= q;
232                         qlp_coeff[i] = q;
233                 }
234         }
235         /* negative shift is very rare but due to design flaw, negative shift is
236          * a NOP in the decoder, so it must be handled specially by scaling down
237          * coeffs
238          */
239         else {
240                 const int nshift = -(*shift);
241                 FLAC__double error = 0.0;
242                 FLAC__int32 q;
243 #ifdef DEBUG
244                 fprintf(stderr,"FLAC__lpc_quantize_coefficients: negative shift=%d order=%u cmax=%f\n", *shift, order, cmax);
245 #endif
246                 for(i = 0; i < order; i++) {
247                         error += lp_coeff[i] / (1 << nshift);
248                         q = lround(error);
249 #ifdef FLAC__OVERFLOW_DETECT
250                         if(q > qmax+1) /* we expect q==qmax+1 occasionally due to rounding */
251                                 fprintf(stderr,"FLAC__lpc_quantize_coefficients: quantizer overflow: q>qmax %d>%d shift=%d cmax=%f precision=%u lpc[%u]=%f\n",q,qmax,*shift,cmax,precision+1,i,lp_coeff[i]);
252                         else if(q < qmin)
253                                 fprintf(stderr,"FLAC__lpc_quantize_coefficients: quantizer overflow: q<qmin %d<%d shift=%d cmax=%f precision=%u lpc[%u]=%f\n",q,qmin,*shift,cmax,precision+1,i,lp_coeff[i]);
254 #endif
255                         if(q > qmax)
256                                 q = qmax;
257                         else if(q < qmin)
258                                 q = qmin;
259                         error -= q;
260                         qlp_coeff[i] = q;
261                 }
262                 *shift = 0;
263         }
264
265         return 0;
266 }
267
268 void FLAC__lpc_compute_residual_from_qlp_coefficients(const FLAC__int32 *data, unsigned data_len, const FLAC__int32 qlp_coeff[], unsigned order, int lp_quantization, FLAC__int32 residual[])
269 #if defined(FLAC__OVERFLOW_DETECT) || !defined(FLAC__LPC_UNROLLED_FILTER_LOOPS)
270 {
271         FLAC__int64 sumo;
272         unsigned i, j;
273         FLAC__int32 sum;
274         const FLAC__int32 *history;
275
276 #ifdef FLAC__OVERFLOW_DETECT_VERBOSE
277         fprintf(stderr,"FLAC__lpc_compute_residual_from_qlp_coefficients: data_len=%d, order=%u, lpq=%d",data_len,order,lp_quantization);
278         for(i=0;i<order;i++)
279                 fprintf(stderr,", q[%u]=%d",i,qlp_coeff[i]);
280         fprintf(stderr,"\n");
281 #endif
282         FLAC__ASSERT(order > 0);
283
284         for(i = 0; i < data_len; i++) {
285                 sumo = 0;
286                 sum = 0;
287                 history = data;
288                 for(j = 0; j < order; j++) {
289                         sum += qlp_coeff[j] * (*(--history));
290                         sumo += (FLAC__int64)qlp_coeff[j] * (FLAC__int64)(*history);
291                                 fprintf(stderr,"FLAC__lpc_compute_residual_from_qlp_coefficients: OVERFLOW, i=%u, j=%u, c=%d, d=%d, sumo=%" PRId64 "\n",i,j,qlp_coeff[j],*history,sumo);
292                 }
293                 *(residual++) = *(data++) - (sum >> lp_quantization);
294         }
295
296         /* Here's a slower but clearer version:
297         for(i = 0; i < data_len; i++) {
298                 sum = 0;
299                 for(j = 0; j < order; j++)
300                         sum += qlp_coeff[j] * data[i-j-1];
301                 residual[i] = data[i] - (sum >> lp_quantization);
302         }
303         */
304 }
305 #else /* fully unrolled version for normal use */
306 {
307         int i;
308         FLAC__int32 sum;
309
310         FLAC__ASSERT(order > 0);
311         FLAC__ASSERT(order <= 32);
312
313         /*
314          * We do unique versions up to 12th order since that's the subset limit.
315          * Also they are roughly ordered to match frequency of occurrence to
316          * minimize branching.
317          */
318         if(order <= 12) {
319                 if(order > 8) {
320                         if(order > 10) {
321                                 if(order == 12) {
322                                         for(i = 0; i < (int)data_len; i++) {
323                                                 sum = 0;
324                                                 sum += qlp_coeff[11] * data[i-12];
325                                                 sum += qlp_coeff[10] * data[i-11];
326                                                 sum += qlp_coeff[9] * data[i-10];
327                                                 sum += qlp_coeff[8] * data[i-9];
328                                                 sum += qlp_coeff[7] * data[i-8];
329                                                 sum += qlp_coeff[6] * data[i-7];
330                                                 sum += qlp_coeff[5] * data[i-6];
331                                                 sum += qlp_coeff[4] * data[i-5];
332                                                 sum += qlp_coeff[3] * data[i-4];
333                                                 sum += qlp_coeff[2] * data[i-3];
334                                                 sum += qlp_coeff[1] * data[i-2];
335                                                 sum += qlp_coeff[0] * data[i-1];
336                                                 residual[i] = data[i] - (sum >> lp_quantization);
337                                         }
338                                 }
339                                 else { /* order == 11 */
340                                         for(i = 0; i < (int)data_len; i++) {
341                                                 sum = 0;
342                                                 sum += qlp_coeff[10] * data[i-11];
343                                                 sum += qlp_coeff[9] * data[i-10];
344                                                 sum += qlp_coeff[8] * data[i-9];
345                                                 sum += qlp_coeff[7] * data[i-8];
346                                                 sum += qlp_coeff[6] * data[i-7];
347                                                 sum += qlp_coeff[5] * data[i-6];
348                                                 sum += qlp_coeff[4] * data[i-5];
349                                                 sum += qlp_coeff[3] * data[i-4];
350                                                 sum += qlp_coeff[2] * data[i-3];
351                                                 sum += qlp_coeff[1] * data[i-2];
352                                                 sum += qlp_coeff[0] * data[i-1];
353                                                 residual[i] = data[i] - (sum >> lp_quantization);
354                                         }
355                                 }
356                         }
357                         else {
358                                 if(order == 10) {
359                                         for(i = 0; i < (int)data_len; i++) {
360                                                 sum = 0;
361                                                 sum += qlp_coeff[9] * data[i-10];
362                                                 sum += qlp_coeff[8] * data[i-9];
363                                                 sum += qlp_coeff[7] * data[i-8];
364                                                 sum += qlp_coeff[6] * data[i-7];
365                                                 sum += qlp_coeff[5] * data[i-6];
366                                                 sum += qlp_coeff[4] * data[i-5];
367                                                 sum += qlp_coeff[3] * data[i-4];
368                                                 sum += qlp_coeff[2] * data[i-3];
369                                                 sum += qlp_coeff[1] * data[i-2];
370                                                 sum += qlp_coeff[0] * data[i-1];
371                                                 residual[i] = data[i] - (sum >> lp_quantization);
372                                         }
373                                 }
374                                 else { /* order == 9 */
375                                         for(i = 0; i < (int)data_len; i++) {
376                                                 sum = 0;
377                                                 sum += qlp_coeff[8] * data[i-9];
378                                                 sum += qlp_coeff[7] * data[i-8];
379                                                 sum += qlp_coeff[6] * data[i-7];
380                                                 sum += qlp_coeff[5] * data[i-6];
381                                                 sum += qlp_coeff[4] * data[i-5];
382                                                 sum += qlp_coeff[3] * data[i-4];
383                                                 sum += qlp_coeff[2] * data[i-3];
384                                                 sum += qlp_coeff[1] * data[i-2];
385                                                 sum += qlp_coeff[0] * data[i-1];
386                                                 residual[i] = data[i] - (sum >> lp_quantization);
387                                         }
388                                 }
389                         }
390                 }
391                 else if(order > 4) {
392                         if(order > 6) {
393                                 if(order == 8) {
394                                         for(i = 0; i < (int)data_len; i++) {
395                                                 sum = 0;
396                                                 sum += qlp_coeff[7] * data[i-8];
397                                                 sum += qlp_coeff[6] * data[i-7];
398                                                 sum += qlp_coeff[5] * data[i-6];
399                                                 sum += qlp_coeff[4] * data[i-5];
400                                                 sum += qlp_coeff[3] * data[i-4];
401                                                 sum += qlp_coeff[2] * data[i-3];
402                                                 sum += qlp_coeff[1] * data[i-2];
403                                                 sum += qlp_coeff[0] * data[i-1];
404                                                 residual[i] = data[i] - (sum >> lp_quantization);
405                                         }
406                                 }
407                                 else { /* order == 7 */
408                                         for(i = 0; i < (int)data_len; i++) {
409                                                 sum = 0;
410                                                 sum += qlp_coeff[6] * data[i-7];
411                                                 sum += qlp_coeff[5] * data[i-6];
412                                                 sum += qlp_coeff[4] * data[i-5];
413                                                 sum += qlp_coeff[3] * data[i-4];
414                                                 sum += qlp_coeff[2] * data[i-3];
415                                                 sum += qlp_coeff[1] * data[i-2];
416                                                 sum += qlp_coeff[0] * data[i-1];
417                                                 residual[i] = data[i] - (sum >> lp_quantization);
418                                         }
419                                 }
420                         }
421                         else {
422                                 if(order == 6) {
423                                         for(i = 0; i < (int)data_len; i++) {
424                                                 sum = 0;
425                                                 sum += qlp_coeff[5] * data[i-6];
426                                                 sum += qlp_coeff[4] * data[i-5];
427                                                 sum += qlp_coeff[3] * data[i-4];
428                                                 sum += qlp_coeff[2] * data[i-3];
429                                                 sum += qlp_coeff[1] * data[i-2];
430                                                 sum += qlp_coeff[0] * data[i-1];
431                                                 residual[i] = data[i] - (sum >> lp_quantization);
432                                         }
433                                 }
434                                 else { /* order == 5 */
435                                         for(i = 0; i < (int)data_len; i++) {
436                                                 sum = 0;
437                                                 sum += qlp_coeff[4] * data[i-5];
438                                                 sum += qlp_coeff[3] * data[i-4];
439                                                 sum += qlp_coeff[2] * data[i-3];
440                                                 sum += qlp_coeff[1] * data[i-2];
441                                                 sum += qlp_coeff[0] * data[i-1];
442                                                 residual[i] = data[i] - (sum >> lp_quantization);
443                                         }
444                                 }
445                         }
446                 }
447                 else {
448                         if(order > 2) {
449                                 if(order == 4) {
450                                         for(i = 0; i < (int)data_len; i++) {
451                                                 sum = 0;
452                                                 sum += qlp_coeff[3] * data[i-4];
453                                                 sum += qlp_coeff[2] * data[i-3];
454                                                 sum += qlp_coeff[1] * data[i-2];
455                                                 sum += qlp_coeff[0] * data[i-1];
456                                                 residual[i] = data[i] - (sum >> lp_quantization);
457                                         }
458                                 }
459                                 else { /* order == 3 */
460                                         for(i = 0; i < (int)data_len; i++) {
461                                                 sum = 0;
462                                                 sum += qlp_coeff[2] * data[i-3];
463                                                 sum += qlp_coeff[1] * data[i-2];
464                                                 sum += qlp_coeff[0] * data[i-1];
465                                                 residual[i] = data[i] - (sum >> lp_quantization);
466                                         }
467                                 }
468                         }
469                         else {
470                                 if(order == 2) {
471                                         for(i = 0; i < (int)data_len; i++) {
472                                                 sum = 0;
473                                                 sum += qlp_coeff[1] * data[i-2];
474                                                 sum += qlp_coeff[0] * data[i-1];
475                                                 residual[i] = data[i] - (sum >> lp_quantization);
476                                         }
477                                 }
478                                 else { /* order == 1 */
479                                         for(i = 0; i < (int)data_len; i++)
480                                                 residual[i] = data[i] - ((qlp_coeff[0] * data[i-1]) >> lp_quantization);
481                                 }
482                         }
483                 }
484         }
485         else { /* order > 12 */
486                 for(i = 0; i < (int)data_len; i++) {
487                         sum = 0;
488                         switch(order) {
489                                 case 32: sum += qlp_coeff[31] * data[i-32];
490                                 case 31: sum += qlp_coeff[30] * data[i-31];
491                                 case 30: sum += qlp_coeff[29] * data[i-30];
492                                 case 29: sum += qlp_coeff[28] * data[i-29];
493                                 case 28: sum += qlp_coeff[27] * data[i-28];
494                                 case 27: sum += qlp_coeff[26] * data[i-27];
495                                 case 26: sum += qlp_coeff[25] * data[i-26];
496                                 case 25: sum += qlp_coeff[24] * data[i-25];
497                                 case 24: sum += qlp_coeff[23] * data[i-24];
498                                 case 23: sum += qlp_coeff[22] * data[i-23];
499                                 case 22: sum += qlp_coeff[21] * data[i-22];
500                                 case 21: sum += qlp_coeff[20] * data[i-21];
501                                 case 20: sum += qlp_coeff[19] * data[i-20];
502                                 case 19: sum += qlp_coeff[18] * data[i-19];
503                                 case 18: sum += qlp_coeff[17] * data[i-18];
504                                 case 17: sum += qlp_coeff[16] * data[i-17];
505                                 case 16: sum += qlp_coeff[15] * data[i-16];
506                                 case 15: sum += qlp_coeff[14] * data[i-15];
507                                 case 14: sum += qlp_coeff[13] * data[i-14];
508                                 case 13: sum += qlp_coeff[12] * data[i-13];
509                                          sum += qlp_coeff[11] * data[i-12];
510                                          sum += qlp_coeff[10] * data[i-11];
511                                          sum += qlp_coeff[ 9] * data[i-10];
512                                          sum += qlp_coeff[ 8] * data[i- 9];
513                                          sum += qlp_coeff[ 7] * data[i- 8];
514                                          sum += qlp_coeff[ 6] * data[i- 7];
515                                          sum += qlp_coeff[ 5] * data[i- 6];
516                                          sum += qlp_coeff[ 4] * data[i- 5];
517                                          sum += qlp_coeff[ 3] * data[i- 4];
518                                          sum += qlp_coeff[ 2] * data[i- 3];
519                                          sum += qlp_coeff[ 1] * data[i- 2];
520                                          sum += qlp_coeff[ 0] * data[i- 1];
521                         }
522                         residual[i] = data[i] - (sum >> lp_quantization);
523                 }
524         }
525 }
526 #endif
527
528 void FLAC__lpc_compute_residual_from_qlp_coefficients_wide(const FLAC__int32 *data, unsigned data_len, const FLAC__int32 qlp_coeff[], unsigned order, int lp_quantization, FLAC__int32 residual[])
529 #if defined(FLAC__OVERFLOW_DETECT) || !defined(FLAC__LPC_UNROLLED_FILTER_LOOPS)
530 {
531         unsigned i, j;
532         FLAC__int64 sum;
533         const FLAC__int32 *history;
534
535 #ifdef FLAC__OVERFLOW_DETECT_VERBOSE
536         fprintf(stderr,"FLAC__lpc_compute_residual_from_qlp_coefficients_wide: data_len=%d, order=%u, lpq=%d",data_len,order,lp_quantization);
537         for(i=0;i<order;i++)
538                 fprintf(stderr,", q[%u]=%d",i,qlp_coeff[i]);
539         fprintf(stderr,"\n");
540 #endif
541         FLAC__ASSERT(order > 0);
542
543         for(i = 0; i < data_len; i++) {
544                 sum = 0;
545                 history = data;
546                 for(j = 0; j < order; j++)
547                         sum += (FLAC__int64)qlp_coeff[j] * (FLAC__int64)(*(--history));
548                 if(FLAC__bitmath_silog2_wide(sum >> lp_quantization) > 32) {
549                         fprintf(stderr,"FLAC__lpc_compute_residual_from_qlp_coefficients_wide: OVERFLOW, i=%u, sum=%" PRId64 "\n", i, (sum >> lp_quantization));
550                         break;
551                 }
552                 if(FLAC__bitmath_silog2_wide((FLAC__int64)(*data) - (sum >> lp_quantization)) > 32) {
553                         fprintf(stderr,"FLAC__lpc_compute_residual_from_qlp_coefficients_wide: OVERFLOW, i=%u, data=%d, sum=%" PRId64 ", residual=%" PRId64 "\n", i, *data, (long long)(sum >> lp_quantization), ((FLAC__int64)(*data) - (sum >> lp_quantization)));
554                         break;
555                 }
556                 *(residual++) = *(data++) - (FLAC__int32)(sum >> lp_quantization);
557         }
558 }
559 #else /* fully unrolled version for normal use */
560 {
561         int i;
562         FLAC__int64 sum;
563
564         FLAC__ASSERT(order > 0);
565         FLAC__ASSERT(order <= 32);
566
567         /*
568          * We do unique versions up to 12th order since that's the subset limit.
569          * Also they are roughly ordered to match frequency of occurrence to
570          * minimize branching.
571          */
572         if(order <= 12) {
573                 if(order > 8) {
574                         if(order > 10) {
575                                 if(order == 12) {
576                                         for(i = 0; i < (int)data_len; i++) {
577                                                 sum = 0;
578                                                 sum += qlp_coeff[11] * (FLAC__int64)data[i-12];
579                                                 sum += qlp_coeff[10] * (FLAC__int64)data[i-11];
580                                                 sum += qlp_coeff[9] * (FLAC__int64)data[i-10];
581                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
582                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
583                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
584                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
585                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
586                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
587                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
588                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
589                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
590                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
591                                         }
592                                 }
593                                 else { /* order == 11 */
594                                         for(i = 0; i < (int)data_len; i++) {
595                                                 sum = 0;
596                                                 sum += qlp_coeff[10] * (FLAC__int64)data[i-11];
597                                                 sum += qlp_coeff[9] * (FLAC__int64)data[i-10];
598                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
599                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
600                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
601                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
602                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
603                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
604                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
605                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
606                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
607                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
608                                         }
609                                 }
610                         }
611                         else {
612                                 if(order == 10) {
613                                         for(i = 0; i < (int)data_len; i++) {
614                                                 sum = 0;
615                                                 sum += qlp_coeff[9] * (FLAC__int64)data[i-10];
616                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
617                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
618                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
619                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
620                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
621                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
622                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
623                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
624                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
625                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
626                                         }
627                                 }
628                                 else { /* order == 9 */
629                                         for(i = 0; i < (int)data_len; i++) {
630                                                 sum = 0;
631                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
632                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
633                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
634                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
635                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
636                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
637                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
638                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
639                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
640                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
641                                         }
642                                 }
643                         }
644                 }
645                 else if(order > 4) {
646                         if(order > 6) {
647                                 if(order == 8) {
648                                         for(i = 0; i < (int)data_len; i++) {
649                                                 sum = 0;
650                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
651                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
652                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
653                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
654                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
655                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
656                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
657                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
658                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
659                                         }
660                                 }
661                                 else { /* order == 7 */
662                                         for(i = 0; i < (int)data_len; i++) {
663                                                 sum = 0;
664                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
665                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
666                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
667                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
668                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
669                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
670                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
671                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
672                                         }
673                                 }
674                         }
675                         else {
676                                 if(order == 6) {
677                                         for(i = 0; i < (int)data_len; i++) {
678                                                 sum = 0;
679                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
680                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
681                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
682                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
683                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
684                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
685                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
686                                         }
687                                 }
688                                 else { /* order == 5 */
689                                         for(i = 0; i < (int)data_len; i++) {
690                                                 sum = 0;
691                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
692                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
693                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
694                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
695                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
696                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
697                                         }
698                                 }
699                         }
700                 }
701                 else {
702                         if(order > 2) {
703                                 if(order == 4) {
704                                         for(i = 0; i < (int)data_len; i++) {
705                                                 sum = 0;
706                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
707                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
708                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
709                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
710                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
711                                         }
712                                 }
713                                 else { /* order == 3 */
714                                         for(i = 0; i < (int)data_len; i++) {
715                                                 sum = 0;
716                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
717                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
718                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
719                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
720                                         }
721                                 }
722                         }
723                         else {
724                                 if(order == 2) {
725                                         for(i = 0; i < (int)data_len; i++) {
726                                                 sum = 0;
727                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
728                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
729                                                 residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
730                                         }
731                                 }
732                                 else { /* order == 1 */
733                                         for(i = 0; i < (int)data_len; i++)
734                                                 residual[i] = data[i] - (FLAC__int32)((qlp_coeff[0] * (FLAC__int64)data[i-1]) >> lp_quantization);
735                                 }
736                         }
737                 }
738         }
739         else { /* order > 12 */
740                 for(i = 0; i < (int)data_len; i++) {
741                         sum = 0;
742                         switch(order) {
743                                 case 32: sum += qlp_coeff[31] * (FLAC__int64)data[i-32];
744                                 case 31: sum += qlp_coeff[30] * (FLAC__int64)data[i-31];
745                                 case 30: sum += qlp_coeff[29] * (FLAC__int64)data[i-30];
746                                 case 29: sum += qlp_coeff[28] * (FLAC__int64)data[i-29];
747                                 case 28: sum += qlp_coeff[27] * (FLAC__int64)data[i-28];
748                                 case 27: sum += qlp_coeff[26] * (FLAC__int64)data[i-27];
749                                 case 26: sum += qlp_coeff[25] * (FLAC__int64)data[i-26];
750                                 case 25: sum += qlp_coeff[24] * (FLAC__int64)data[i-25];
751                                 case 24: sum += qlp_coeff[23] * (FLAC__int64)data[i-24];
752                                 case 23: sum += qlp_coeff[22] * (FLAC__int64)data[i-23];
753                                 case 22: sum += qlp_coeff[21] * (FLAC__int64)data[i-22];
754                                 case 21: sum += qlp_coeff[20] * (FLAC__int64)data[i-21];
755                                 case 20: sum += qlp_coeff[19] * (FLAC__int64)data[i-20];
756                                 case 19: sum += qlp_coeff[18] * (FLAC__int64)data[i-19];
757                                 case 18: sum += qlp_coeff[17] * (FLAC__int64)data[i-18];
758                                 case 17: sum += qlp_coeff[16] * (FLAC__int64)data[i-17];
759                                 case 16: sum += qlp_coeff[15] * (FLAC__int64)data[i-16];
760                                 case 15: sum += qlp_coeff[14] * (FLAC__int64)data[i-15];
761                                 case 14: sum += qlp_coeff[13] * (FLAC__int64)data[i-14];
762                                 case 13: sum += qlp_coeff[12] * (FLAC__int64)data[i-13];
763                                          sum += qlp_coeff[11] * (FLAC__int64)data[i-12];
764                                          sum += qlp_coeff[10] * (FLAC__int64)data[i-11];
765                                          sum += qlp_coeff[ 9] * (FLAC__int64)data[i-10];
766                                          sum += qlp_coeff[ 8] * (FLAC__int64)data[i- 9];
767                                          sum += qlp_coeff[ 7] * (FLAC__int64)data[i- 8];
768                                          sum += qlp_coeff[ 6] * (FLAC__int64)data[i- 7];
769                                          sum += qlp_coeff[ 5] * (FLAC__int64)data[i- 6];
770                                          sum += qlp_coeff[ 4] * (FLAC__int64)data[i- 5];
771                                          sum += qlp_coeff[ 3] * (FLAC__int64)data[i- 4];
772                                          sum += qlp_coeff[ 2] * (FLAC__int64)data[i- 3];
773                                          sum += qlp_coeff[ 1] * (FLAC__int64)data[i- 2];
774                                          sum += qlp_coeff[ 0] * (FLAC__int64)data[i- 1];
775                         }
776                         residual[i] = data[i] - (FLAC__int32)(sum >> lp_quantization);
777                 }
778         }
779 }
780 #endif
781
782 #endif /* !defined FLAC__INTEGER_ONLY_LIBRARY */
783
784 void FLAC__lpc_restore_signal(const FLAC__int32 residual[], unsigned data_len, const FLAC__int32 qlp_coeff[], unsigned order, int lp_quantization, FLAC__int32 data[])
785 #if defined(FLAC__OVERFLOW_DETECT) || !defined(FLAC__LPC_UNROLLED_FILTER_LOOPS)
786 {
787         FLAC__int64 sumo;
788         unsigned i, j;
789         FLAC__int32 sum;
790         const FLAC__int32 *r = residual, *history;
791
792 #ifdef FLAC__OVERFLOW_DETECT_VERBOSE
793         fprintf(stderr,"FLAC__lpc_restore_signal: data_len=%d, order=%u, lpq=%d",data_len,order,lp_quantization);
794         for(i=0;i<order;i++)
795                 fprintf(stderr,", q[%u]=%d",i,qlp_coeff[i]);
796         fprintf(stderr,"\n");
797 #endif
798         FLAC__ASSERT(order > 0);
799
800         for(i = 0; i < data_len; i++) {
801                 sumo = 0;
802                 sum = 0;
803                 history = data;
804                 for(j = 0; j < order; j++) {
805                         sum += qlp_coeff[j] * (*(--history));
806                         sumo += (FLAC__int64)qlp_coeff[j] * (FLAC__int64)(*history);
807                         if(sumo > 2147483647ll || sumo < -2147483648ll)
808                                 fprintf(stderr,"FLAC__lpc_restore_signal: OVERFLOW, i=%u, j=%u, c=%d, d=%d, sumo=%" PRId64 "\n",i,j,qlp_coeff[j],*history,sumo);
809                 }
810                 *(data++) = *(r++) + (sum >> lp_quantization);
811         }
812
813         /* Here's a slower but clearer version:
814         for(i = 0; i < data_len; i++) {
815                 sum = 0;
816                 for(j = 0; j < order; j++)
817                         sum += qlp_coeff[j] * data[i-j-1];
818                 data[i] = residual[i] + (sum >> lp_quantization);
819         }
820         */
821 }
822 #else /* fully unrolled version for normal use */
823 {
824         int i;
825         FLAC__int32 sum;
826
827         FLAC__ASSERT(order > 0);
828         FLAC__ASSERT(order <= 32);
829
830         /*
831          * We do unique versions up to 12th order since that's the subset limit.
832          * Also they are roughly ordered to match frequency of occurrence to
833          * minimize branching.
834          */
835         if(order <= 12) {
836                 if(order > 8) {
837                         if(order > 10) {
838                                 if(order == 12) {
839                                         for(i = 0; i < (int)data_len; i++) {
840                                                 sum = 0;
841                                                 sum += qlp_coeff[11] * data[i-12];
842                                                 sum += qlp_coeff[10] * data[i-11];
843                                                 sum += qlp_coeff[9] * data[i-10];
844                                                 sum += qlp_coeff[8] * data[i-9];
845                                                 sum += qlp_coeff[7] * data[i-8];
846                                                 sum += qlp_coeff[6] * data[i-7];
847                                                 sum += qlp_coeff[5] * data[i-6];
848                                                 sum += qlp_coeff[4] * data[i-5];
849                                                 sum += qlp_coeff[3] * data[i-4];
850                                                 sum += qlp_coeff[2] * data[i-3];
851                                                 sum += qlp_coeff[1] * data[i-2];
852                                                 sum += qlp_coeff[0] * data[i-1];
853                                                 data[i] = residual[i] + (sum >> lp_quantization);
854                                         }
855                                 }
856                                 else { /* order == 11 */
857                                         for(i = 0; i < (int)data_len; i++) {
858                                                 sum = 0;
859                                                 sum += qlp_coeff[10] * data[i-11];
860                                                 sum += qlp_coeff[9] * data[i-10];
861                                                 sum += qlp_coeff[8] * data[i-9];
862                                                 sum += qlp_coeff[7] * data[i-8];
863                                                 sum += qlp_coeff[6] * data[i-7];
864                                                 sum += qlp_coeff[5] * data[i-6];
865                                                 sum += qlp_coeff[4] * data[i-5];
866                                                 sum += qlp_coeff[3] * data[i-4];
867                                                 sum += qlp_coeff[2] * data[i-3];
868                                                 sum += qlp_coeff[1] * data[i-2];
869                                                 sum += qlp_coeff[0] * data[i-1];
870                                                 data[i] = residual[i] + (sum >> lp_quantization);
871                                         }
872                                 }
873                         }
874                         else {
875                                 if(order == 10) {
876                                         for(i = 0; i < (int)data_len; i++) {
877                                                 sum = 0;
878                                                 sum += qlp_coeff[9] * data[i-10];
879                                                 sum += qlp_coeff[8] * data[i-9];
880                                                 sum += qlp_coeff[7] * data[i-8];
881                                                 sum += qlp_coeff[6] * data[i-7];
882                                                 sum += qlp_coeff[5] * data[i-6];
883                                                 sum += qlp_coeff[4] * data[i-5];
884                                                 sum += qlp_coeff[3] * data[i-4];
885                                                 sum += qlp_coeff[2] * data[i-3];
886                                                 sum += qlp_coeff[1] * data[i-2];
887                                                 sum += qlp_coeff[0] * data[i-1];
888                                                 data[i] = residual[i] + (sum >> lp_quantization);
889                                         }
890                                 }
891                                 else { /* order == 9 */
892                                         for(i = 0; i < (int)data_len; i++) {
893                                                 sum = 0;
894                                                 sum += qlp_coeff[8] * data[i-9];
895                                                 sum += qlp_coeff[7] * data[i-8];
896                                                 sum += qlp_coeff[6] * data[i-7];
897                                                 sum += qlp_coeff[5] * data[i-6];
898                                                 sum += qlp_coeff[4] * data[i-5];
899                                                 sum += qlp_coeff[3] * data[i-4];
900                                                 sum += qlp_coeff[2] * data[i-3];
901                                                 sum += qlp_coeff[1] * data[i-2];
902                                                 sum += qlp_coeff[0] * data[i-1];
903                                                 data[i] = residual[i] + (sum >> lp_quantization);
904                                         }
905                                 }
906                         }
907                 }
908                 else if(order > 4) {
909                         if(order > 6) {
910                                 if(order == 8) {
911                                         for(i = 0; i < (int)data_len; i++) {
912                                                 sum = 0;
913                                                 sum += qlp_coeff[7] * data[i-8];
914                                                 sum += qlp_coeff[6] * data[i-7];
915                                                 sum += qlp_coeff[5] * data[i-6];
916                                                 sum += qlp_coeff[4] * data[i-5];
917                                                 sum += qlp_coeff[3] * data[i-4];
918                                                 sum += qlp_coeff[2] * data[i-3];
919                                                 sum += qlp_coeff[1] * data[i-2];
920                                                 sum += qlp_coeff[0] * data[i-1];
921                                                 data[i] = residual[i] + (sum >> lp_quantization);
922                                         }
923                                 }
924                                 else { /* order == 7 */
925                                         for(i = 0; i < (int)data_len; i++) {
926                                                 sum = 0;
927                                                 sum += qlp_coeff[6] * data[i-7];
928                                                 sum += qlp_coeff[5] * data[i-6];
929                                                 sum += qlp_coeff[4] * data[i-5];
930                                                 sum += qlp_coeff[3] * data[i-4];
931                                                 sum += qlp_coeff[2] * data[i-3];
932                                                 sum += qlp_coeff[1] * data[i-2];
933                                                 sum += qlp_coeff[0] * data[i-1];
934                                                 data[i] = residual[i] + (sum >> lp_quantization);
935                                         }
936                                 }
937                         }
938                         else {
939                                 if(order == 6) {
940                                         for(i = 0; i < (int)data_len; i++) {
941                                                 sum = 0;
942                                                 sum += qlp_coeff[5] * data[i-6];
943                                                 sum += qlp_coeff[4] * data[i-5];
944                                                 sum += qlp_coeff[3] * data[i-4];
945                                                 sum += qlp_coeff[2] * data[i-3];
946                                                 sum += qlp_coeff[1] * data[i-2];
947                                                 sum += qlp_coeff[0] * data[i-1];
948                                                 data[i] = residual[i] + (sum >> lp_quantization);
949                                         }
950                                 }
951                                 else { /* order == 5 */
952                                         for(i = 0; i < (int)data_len; i++) {
953                                                 sum = 0;
954                                                 sum += qlp_coeff[4] * data[i-5];
955                                                 sum += qlp_coeff[3] * data[i-4];
956                                                 sum += qlp_coeff[2] * data[i-3];
957                                                 sum += qlp_coeff[1] * data[i-2];
958                                                 sum += qlp_coeff[0] * data[i-1];
959                                                 data[i] = residual[i] + (sum >> lp_quantization);
960                                         }
961                                 }
962                         }
963                 }
964                 else {
965                         if(order > 2) {
966                                 if(order == 4) {
967                                         for(i = 0; i < (int)data_len; i++) {
968                                                 sum = 0;
969                                                 sum += qlp_coeff[3] * data[i-4];
970                                                 sum += qlp_coeff[2] * data[i-3];
971                                                 sum += qlp_coeff[1] * data[i-2];
972                                                 sum += qlp_coeff[0] * data[i-1];
973                                                 data[i] = residual[i] + (sum >> lp_quantization);
974                                         }
975                                 }
976                                 else { /* order == 3 */
977                                         for(i = 0; i < (int)data_len; i++) {
978                                                 sum = 0;
979                                                 sum += qlp_coeff[2] * data[i-3];
980                                                 sum += qlp_coeff[1] * data[i-2];
981                                                 sum += qlp_coeff[0] * data[i-1];
982                                                 data[i] = residual[i] + (sum >> lp_quantization);
983                                         }
984                                 }
985                         }
986                         else {
987                                 if(order == 2) {
988                                         for(i = 0; i < (int)data_len; i++) {
989                                                 sum = 0;
990                                                 sum += qlp_coeff[1] * data[i-2];
991                                                 sum += qlp_coeff[0] * data[i-1];
992                                                 data[i] = residual[i] + (sum >> lp_quantization);
993                                         }
994                                 }
995                                 else { /* order == 1 */
996                                         for(i = 0; i < (int)data_len; i++)
997                                                 data[i] = residual[i] + ((qlp_coeff[0] * data[i-1]) >> lp_quantization);
998                                 }
999                         }
1000                 }
1001         }
1002         else { /* order > 12 */
1003                 for(i = 0; i < (int)data_len; i++) {
1004                         sum = 0;
1005                         switch(order) {
1006                                 case 32: sum += qlp_coeff[31] * data[i-32];
1007                                 case 31: sum += qlp_coeff[30] * data[i-31];
1008                                 case 30: sum += qlp_coeff[29] * data[i-30];
1009                                 case 29: sum += qlp_coeff[28] * data[i-29];
1010                                 case 28: sum += qlp_coeff[27] * data[i-28];
1011                                 case 27: sum += qlp_coeff[26] * data[i-27];
1012                                 case 26: sum += qlp_coeff[25] * data[i-26];
1013                                 case 25: sum += qlp_coeff[24] * data[i-25];
1014                                 case 24: sum += qlp_coeff[23] * data[i-24];
1015                                 case 23: sum += qlp_coeff[22] * data[i-23];
1016                                 case 22: sum += qlp_coeff[21] * data[i-22];
1017                                 case 21: sum += qlp_coeff[20] * data[i-21];
1018                                 case 20: sum += qlp_coeff[19] * data[i-20];
1019                                 case 19: sum += qlp_coeff[18] * data[i-19];
1020                                 case 18: sum += qlp_coeff[17] * data[i-18];
1021                                 case 17: sum += qlp_coeff[16] * data[i-17];
1022                                 case 16: sum += qlp_coeff[15] * data[i-16];
1023                                 case 15: sum += qlp_coeff[14] * data[i-15];
1024                                 case 14: sum += qlp_coeff[13] * data[i-14];
1025                                 case 13: sum += qlp_coeff[12] * data[i-13];
1026                                          sum += qlp_coeff[11] * data[i-12];
1027                                          sum += qlp_coeff[10] * data[i-11];
1028                                          sum += qlp_coeff[ 9] * data[i-10];
1029                                          sum += qlp_coeff[ 8] * data[i- 9];
1030                                          sum += qlp_coeff[ 7] * data[i- 8];
1031                                          sum += qlp_coeff[ 6] * data[i- 7];
1032                                          sum += qlp_coeff[ 5] * data[i- 6];
1033                                          sum += qlp_coeff[ 4] * data[i- 5];
1034                                          sum += qlp_coeff[ 3] * data[i- 4];
1035                                          sum += qlp_coeff[ 2] * data[i- 3];
1036                                          sum += qlp_coeff[ 1] * data[i- 2];
1037                                          sum += qlp_coeff[ 0] * data[i- 1];
1038                         }
1039                         data[i] = residual[i] + (sum >> lp_quantization);
1040                 }
1041         }
1042 }
1043 #endif
1044
1045 void FLAC__lpc_restore_signal_wide(const FLAC__int32 residual[], unsigned data_len, const FLAC__int32 qlp_coeff[], unsigned order, int lp_quantization, FLAC__int32 data[])
1046 #if defined(FLAC__OVERFLOW_DETECT) || !defined(FLAC__LPC_UNROLLED_FILTER_LOOPS)
1047 {
1048         unsigned i, j;
1049         FLAC__int64 sum;
1050         const FLAC__int32 *r = residual, *history;
1051
1052 #ifdef FLAC__OVERFLOW_DETECT_VERBOSE
1053         fprintf(stderr,"FLAC__lpc_restore_signal_wide: data_len=%d, order=%u, lpq=%d",data_len,order,lp_quantization);
1054         for(i=0;i<order;i++)
1055                 fprintf(stderr,", q[%u]=%d",i,qlp_coeff[i]);
1056         fprintf(stderr,"\n");
1057 #endif
1058         FLAC__ASSERT(order > 0);
1059
1060         for(i = 0; i < data_len; i++) {
1061                 sum = 0;
1062                 history = data;
1063                 for(j = 0; j < order; j++)
1064                         sum += (FLAC__int64)qlp_coeff[j] * (FLAC__int64)(*(--history));
1065                 if(FLAC__bitmath_silog2_wide(sum >> lp_quantization) > 32) {
1066                         fprintf(stderr,"FLAC__lpc_restore_signal_wide: OVERFLOW, i=%u, sum=%" PRId64 "\n", i, (sum >> lp_quantization));
1067                         break;
1068                 }
1069                 if(FLAC__bitmath_silog2_wide((FLAC__int64)(*r) + (sum >> lp_quantization)) > 32) {
1070                         fprintf(stderr,"FLAC__lpc_restore_signal_wide: OVERFLOW, i=%u, residual=%d, sum=%" PRId64 ", data=%" PRId64 "\n", i, *r, (sum >> lp_quantization), ((FLAC__int64)(*r) + (sum >> lp_quantization)));
1071                         break;
1072                 }
1073                 *(data++) = *(r++) + (FLAC__int32)(sum >> lp_quantization);
1074         }
1075 }
1076 #else /* fully unrolled version for normal use */
1077 {
1078         int i;
1079         FLAC__int64 sum;
1080
1081         FLAC__ASSERT(order > 0);
1082         FLAC__ASSERT(order <= 32);
1083
1084         /*
1085          * We do unique versions up to 12th order since that's the subset limit.
1086          * Also they are roughly ordered to match frequency of occurrence to
1087          * minimize branching.
1088          */
1089         if(order <= 12) {
1090                 if(order > 8) {
1091                         if(order > 10) {
1092                                 if(order == 12) {
1093                                         for(i = 0; i < (int)data_len; i++) {
1094                                                 sum = 0;
1095                                                 sum += qlp_coeff[11] * (FLAC__int64)data[i-12];
1096                                                 sum += qlp_coeff[10] * (FLAC__int64)data[i-11];
1097                                                 sum += qlp_coeff[9] * (FLAC__int64)data[i-10];
1098                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
1099                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
1100                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
1101                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
1102                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1103                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1104                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1105                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1106                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1107                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1108                                         }
1109                                 }
1110                                 else { /* order == 11 */
1111                                         for(i = 0; i < (int)data_len; i++) {
1112                                                 sum = 0;
1113                                                 sum += qlp_coeff[10] * (FLAC__int64)data[i-11];
1114                                                 sum += qlp_coeff[9] * (FLAC__int64)data[i-10];
1115                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
1116                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
1117                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
1118                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
1119                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1120                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1121                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1122                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1123                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1124                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1125                                         }
1126                                 }
1127                         }
1128                         else {
1129                                 if(order == 10) {
1130                                         for(i = 0; i < (int)data_len; i++) {
1131                                                 sum = 0;
1132                                                 sum += qlp_coeff[9] * (FLAC__int64)data[i-10];
1133                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
1134                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
1135                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
1136                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
1137                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1138                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1139                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1140                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1141                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1142                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1143                                         }
1144                                 }
1145                                 else { /* order == 9 */
1146                                         for(i = 0; i < (int)data_len; i++) {
1147                                                 sum = 0;
1148                                                 sum += qlp_coeff[8] * (FLAC__int64)data[i-9];
1149                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
1150                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
1151                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
1152                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1153                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1154                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1155                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1156                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1157                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1158                                         }
1159                                 }
1160                         }
1161                 }
1162                 else if(order > 4) {
1163                         if(order > 6) {
1164                                 if(order == 8) {
1165                                         for(i = 0; i < (int)data_len; i++) {
1166                                                 sum = 0;
1167                                                 sum += qlp_coeff[7] * (FLAC__int64)data[i-8];
1168                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
1169                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
1170                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1171                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1172                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1173                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1174                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1175                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1176                                         }
1177                                 }
1178                                 else { /* order == 7 */
1179                                         for(i = 0; i < (int)data_len; i++) {
1180                                                 sum = 0;
1181                                                 sum += qlp_coeff[6] * (FLAC__int64)data[i-7];
1182                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
1183                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1184                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1185                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1186                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1187                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1188                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1189                                         }
1190                                 }
1191                         }
1192                         else {
1193                                 if(order == 6) {
1194                                         for(i = 0; i < (int)data_len; i++) {
1195                                                 sum = 0;
1196                                                 sum += qlp_coeff[5] * (FLAC__int64)data[i-6];
1197                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1198                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1199                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1200                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1201                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1202                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1203                                         }
1204                                 }
1205                                 else { /* order == 5 */
1206                                         for(i = 0; i < (int)data_len; i++) {
1207                                                 sum = 0;
1208                                                 sum += qlp_coeff[4] * (FLAC__int64)data[i-5];
1209                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1210                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1211                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1212                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1213                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1214                                         }
1215                                 }
1216                         }
1217                 }
1218                 else {
1219                         if(order > 2) {
1220                                 if(order == 4) {
1221                                         for(i = 0; i < (int)data_len; i++) {
1222                                                 sum = 0;
1223                                                 sum += qlp_coeff[3] * (FLAC__int64)data[i-4];
1224                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1225                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1226                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1227                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1228                                         }
1229                                 }
1230                                 else { /* order == 3 */
1231                                         for(i = 0; i < (int)data_len; i++) {
1232                                                 sum = 0;
1233                                                 sum += qlp_coeff[2] * (FLAC__int64)data[i-3];
1234                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1235                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1236                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1237                                         }
1238                                 }
1239                         }
1240                         else {
1241                                 if(order == 2) {
1242                                         for(i = 0; i < (int)data_len; i++) {
1243                                                 sum = 0;
1244                                                 sum += qlp_coeff[1] * (FLAC__int64)data[i-2];
1245                                                 sum += qlp_coeff[0] * (FLAC__int64)data[i-1];
1246                                                 data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1247                                         }
1248                                 }
1249                                 else { /* order == 1 */
1250                                         for(i = 0; i < (int)data_len; i++)
1251                                                 data[i] = residual[i] + (FLAC__int32)((qlp_coeff[0] * (FLAC__int64)data[i-1]) >> lp_quantization);
1252                                 }
1253                         }
1254                 }
1255         }
1256         else { /* order > 12 */
1257                 for(i = 0; i < (int)data_len; i++) {
1258                         sum = 0;
1259                         switch(order) {
1260                                 case 32: sum += qlp_coeff[31] * (FLAC__int64)data[i-32];
1261                                 case 31: sum += qlp_coeff[30] * (FLAC__int64)data[i-31];
1262                                 case 30: sum += qlp_coeff[29] * (FLAC__int64)data[i-30];
1263                                 case 29: sum += qlp_coeff[28] * (FLAC__int64)data[i-29];
1264                                 case 28: sum += qlp_coeff[27] * (FLAC__int64)data[i-28];
1265                                 case 27: sum += qlp_coeff[26] * (FLAC__int64)data[i-27];
1266                                 case 26: sum += qlp_coeff[25] * (FLAC__int64)data[i-26];
1267                                 case 25: sum += qlp_coeff[24] * (FLAC__int64)data[i-25];
1268                                 case 24: sum += qlp_coeff[23] * (FLAC__int64)data[i-24];
1269                                 case 23: sum += qlp_coeff[22] * (FLAC__int64)data[i-23];
1270                                 case 22: sum += qlp_coeff[21] * (FLAC__int64)data[i-22];
1271                                 case 21: sum += qlp_coeff[20] * (FLAC__int64)data[i-21];
1272                                 case 20: sum += qlp_coeff[19] * (FLAC__int64)data[i-20];
1273                                 case 19: sum += qlp_coeff[18] * (FLAC__int64)data[i-19];
1274                                 case 18: sum += qlp_coeff[17] * (FLAC__int64)data[i-18];
1275                                 case 17: sum += qlp_coeff[16] * (FLAC__int64)data[i-17];
1276                                 case 16: sum += qlp_coeff[15] * (FLAC__int64)data[i-16];
1277                                 case 15: sum += qlp_coeff[14] * (FLAC__int64)data[i-15];
1278                                 case 14: sum += qlp_coeff[13] * (FLAC__int64)data[i-14];
1279                                 case 13: sum += qlp_coeff[12] * (FLAC__int64)data[i-13];
1280                                          sum += qlp_coeff[11] * (FLAC__int64)data[i-12];
1281                                          sum += qlp_coeff[10] * (FLAC__int64)data[i-11];
1282                                          sum += qlp_coeff[ 9] * (FLAC__int64)data[i-10];
1283                                          sum += qlp_coeff[ 8] * (FLAC__int64)data[i- 9];
1284                                          sum += qlp_coeff[ 7] * (FLAC__int64)data[i- 8];
1285                                          sum += qlp_coeff[ 6] * (FLAC__int64)data[i- 7];
1286                                          sum += qlp_coeff[ 5] * (FLAC__int64)data[i- 6];
1287                                          sum += qlp_coeff[ 4] * (FLAC__int64)data[i- 5];
1288                                          sum += qlp_coeff[ 3] * (FLAC__int64)data[i- 4];
1289                                          sum += qlp_coeff[ 2] * (FLAC__int64)data[i- 3];
1290                                          sum += qlp_coeff[ 1] * (FLAC__int64)data[i- 2];
1291                                          sum += qlp_coeff[ 0] * (FLAC__int64)data[i- 1];
1292                         }
1293                         data[i] = residual[i] + (FLAC__int32)(sum >> lp_quantization);
1294                 }
1295         }
1296 }
1297 #endif
1298
1299 #ifndef FLAC__INTEGER_ONLY_LIBRARY
1300
1301 FLAC__double FLAC__lpc_compute_expected_bits_per_residual_sample(FLAC__double lpc_error, unsigned total_samples)
1302 {
1303         FLAC__double error_scale;
1304
1305         FLAC__ASSERT(total_samples > 0);
1306
1307         error_scale = 0.5 * M_LN2 * M_LN2 / (FLAC__double)total_samples;
1308
1309         return FLAC__lpc_compute_expected_bits_per_residual_sample_with_error_scale(lpc_error, error_scale);
1310 }
1311
1312 FLAC__double FLAC__lpc_compute_expected_bits_per_residual_sample_with_error_scale(FLAC__double lpc_error, FLAC__double error_scale)
1313 {
1314         if(lpc_error > 0.0) {
1315                 FLAC__double bps = (FLAC__double)0.5 * log(error_scale * lpc_error) / M_LN2;
1316                 if(bps >= 0.0)
1317                         return bps;
1318                 else
1319                         return 0.0;
1320         }
1321         else if(lpc_error < 0.0) { /* error should not be negative but can happen due to inadequate floating-point resolution */
1322                 return 1e32;
1323         }
1324         else {
1325                 return 0.0;
1326         }
1327 }
1328
1329 unsigned FLAC__lpc_compute_best_order(const FLAC__double lpc_error[], unsigned max_order, unsigned total_samples, unsigned overhead_bits_per_order)
1330 {
1331         unsigned order, indx, best_index; /* 'index' the index into lpc_error; index==order-1 since lpc_error[0] is for order==1, lpc_error[1] is for order==2, etc */
1332         FLAC__double bits, best_bits, error_scale;
1333
1334         FLAC__ASSERT(max_order > 0);
1335         FLAC__ASSERT(total_samples > 0);
1336
1337         error_scale = 0.5 * M_LN2 * M_LN2 / (FLAC__double)total_samples;
1338
1339         best_index = 0;
1340         best_bits = (unsigned)(-1);
1341
1342         for(indx = 0, order = 1; indx < max_order; indx++, order++) {
1343                 bits = FLAC__lpc_compute_expected_bits_per_residual_sample_with_error_scale(lpc_error[indx], error_scale) * (FLAC__double)(total_samples - order) + (FLAC__double)(order * overhead_bits_per_order);
1344                 if(bits < best_bits) {
1345                         best_index = indx;
1346                         best_bits = bits;
1347                 }
1348         }
1349
1350         return best_index+1; /* +1 since indx of lpc_error[] is order-1 */
1351 }
1352
1353 #endif /* !defined FLAC__INTEGER_ONLY_LIBRARY */