2 * simple math operations
3 * Copyright (c) 2001, 2002 Fabrice Bellard
4 * Copyright (c) 2006 Michael Niedermayer <michaelni@gmx.at> et al
6 * This file is part of FFmpeg.
8 * FFmpeg is free software; you can redistribute it and/or
9 * modify it under the terms of the GNU Lesser General Public
10 * License as published by the Free Software Foundation; either
11 * version 2.1 of the License, or (at your option) any later version.
13 * FFmpeg is distributed in the hope that it will be useful,
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
16 * Lesser General Public License for more details.
18 * You should have received a copy of the GNU Lesser General Public
19 * License along with FFmpeg; if not, write to the Free Software
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
22 #ifndef AVCODEC_MATHOPS_H
23 #define AVCODEC_MATHOPS_H
27 #include "libavutil/attributes_internal.h"
28 #include "libavutil/common.h"
31 #define MAX_NEG_CROP 1024
33 extern const uint32_t ff_inverse[257];
34 extern const uint8_t ff_log2_run[41];
35 extern const uint8_t ff_sqrt_tab[256];
36 extern const uint8_t attribute_visibility_hidden ff_crop_tab[256 + 2 * MAX_NEG_CROP];
37 extern const uint8_t ff_zigzag_direct[64];
38 extern const uint8_t ff_zigzag_scan[16+1];
41 # include "arm/mathops.h"
43 # include "avr32/mathops.h"
45 # include "mips/mathops.h"
47 # include "ppc/mathops.h"
49 # include "x86/mathops.h"
52 /* generic implementation */
/* Full-width signed product: both operands are converted to int64_t before
 * the multiplication, so the product is computed in 64-bit arithmetic. */
55 # define MUL64(a,b) ((int64_t)(a) * (int64_t)(b))
/* Product of a and b computed through MUL64, then shifted right by s bits.
 * No narrowing cast is applied here, so the value keeps MUL64's 64-bit type. */
59 # define MULL(a,b,s) (MUL64(a, b) >> (s))
63 static av_always_inline int MULH(int a, int b){
64 return MUL64(a, b) >> 32;
69 static av_always_inline unsigned UMULH(unsigned a, unsigned b){
70 return ((uint64_t)(a) * (uint64_t)(b))>>32;
/* Multiply-accumulate: adds MUL64(a, b) to d. d must be a modifiable lvalue;
 * the value of the expression is the updated d. */
75 # define MAC64(d, a, b) ((d) += MUL64(a, b))
/* Multiply-subtract: subtracts MUL64(a, b) from d, updating d in place. */
79 # define MLS64(d, a, b) ((d) -= MUL64(a, b))
82 /* signed 16x16 -> 32 multiply add accumulate */
/*
 * Multiply-accumulate: adds the product ra * rb to rt, which must be a
 * modifiable lvalue and is updated in place. The value of the expression is
 * the updated rt.
 *
 * Both rt and the whole expansion are parenthesized (as MLS16 already does),
 * so the macro behaves as one self-contained expression: operators written
 * next to an invocation no longer get absorbed into the accumulated value.
 */
# define MAC16(rt, ra, rb) ((rt) += (ra) * (rb))
87 /* signed 16x16 -> 32 multiply */
/* Plain product of ra and rb. No cast is applied, so the multiplication is
 * carried out in whatever type the operands promote to. */
89 # define MUL16(ra, rb) ((ra) * (rb))
/* Multiply-subtract: subtracts the product ra * rb from rt, updating rt in
 * place. rt must be a modifiable lvalue. */
93 # define MLS16(rt, ra, rb) ((rt) -= (ra) * (rb))
98 #define mid_pred mid_pred
99 static inline av_const int mid_pred(int a, int b, int c)
117 #define median4 median4
118 static inline av_const int median4(int a, int b, int c, int d)
121 if (c < d) return (FFMIN(b, d) + FFMAX(a, c)) / 2;
122 else return (FFMIN(b, c) + FFMAX(a, d)) / 2;
124 if (c < d) return (FFMIN(a, d) + FFMAX(b, c)) / 2;
125 else return (FFMIN(a, c) + FFMAX(b, d)) / 2;
/*
 * Shift x right by one less than its width in bits, so only the topmost bit
 * of x determines the result. For unsigned x this yields 0 or 1. For a
 * negative signed x the result depends on how the compiler implements right
 * shifts of negative values (all ones, i.e. -1, on the usual targets).
 *
 * The shift count is parenthesized explicitly. The grouping is the same one
 * operator precedence already gave, but spelling it out avoids precedence
 * warnings and makes the intent obvious to the reader.
 */
#define FF_SIGNBIT(x) ((x) >> (CHAR_BIT * sizeof(x) - 1))
133 static inline av_const int sign_extend(int val, unsigned bits)
135 unsigned shift = 8 * sizeof(int) - bits;
136 union { unsigned u; int s; } v = { (unsigned) val << shift };
141 #ifndef sign_extend64
142 static inline av_const int64_t sign_extend64(int64_t val, unsigned bits)
144 unsigned shift = 8 * sizeof(int64_t) - bits;
145 union { uint64_t u; int64_t s; } v = { (uint64_t) val << shift };
151 static inline av_const unsigned zero_extend(unsigned val, unsigned bits)
153 return (val << ((8 * sizeof(int)) - bits)) >> ((8 * sizeof(int)) - bits);
158 #define COPY3_IF_LT(x, y, a, b, c, d)\
167 #define MASK_ABS(mask, level) do { \
168 mask = level >> 31; \
169 level = (level ^ mask) - mask; \
/* Right-shift a, converted to int32_t, by (32 - s) bits. For negative values
 * the bits shifted in depend on the compiler's signed right shift
 * (sign-extending on common targets). With s == 0 the shift count would be
 * 32, which is not a valid count for a 32-bit operand, so s must be >= 1. */
174 # define NEG_SSR32(a,s) ((( int32_t)(a))>>(32-(s)))
/* Unsigned counterpart: converts a to uint32_t and shifts right by (32 - s),
 * i.e. returns the top s bits of a in the low s bits of the result, with
 * zeros above. The same s >= 1 restriction applies. */
178 # define NEG_USR32(a,s) (((uint32_t)(a))>>(32-(s)))
/* Packing helpers, variant that places the FIRST argument in the most
 * significant position and the last argument in the least significant one.
 * NOTE(review): a second set of PACK_* definitions with the opposite argument
 * order follows; the preprocessor condition choosing between the two sets is
 * not visible in this excerpt - presumably target endianness, confirm.
 * NOTE(review): the operands are shifted without any cast. Assuming 32-bit
 * int operands, (a) << 24 overflows for a >= 128 and (a) << 16 overflows for
 * a >= 0x8000 - confirm the operand types callers pass. */
/* Two 8-bit values -> 16 bits: a in bits 15..8, b in bits 7..0. */
183 # define PACK_2U8(a,b) (((a) << 8) | (b))
/* Four 8-bit values -> 32 bits: a in bits 31..24 down to d in bits 7..0. */
186 # define PACK_4U8(a,b,c,d) (((a) << 24) | ((b) << 16) | ((c) << 8) | (d))
/* Two 16-bit values -> 32 bits: a in bits 31..16, b in bits 15..0. */
189 # define PACK_2U16(a,b) (((a) << 16) | (b))
/* Packing helpers, variant that places the FIRST argument in the least
 * significant position and the last argument in the most significant one.
 * NOTE(review): the preprocessor condition that selects this set over the
 * preceding one is not visible in this excerpt - presumably target
 * endianness, confirm.
 * NOTE(review): the operands are shifted without any cast. Assuming 32-bit
 * int operands, (d) << 24 overflows for d >= 128 and (b) << 16 in PACK_2U16
 * overflows for b >= 0x8000 - confirm the operand types callers pass. */
/* Two 8-bit values -> 16 bits: a in bits 7..0, b in bits 15..8. */
193 # define PACK_2U8(a,b) (((b) << 8) | (a))
/* Four 8-bit values -> 32 bits: a in bits 7..0 up to d in bits 31..24. */
196 # define PACK_4U8(a,b,c,d) (((d) << 24) | ((c) << 16) | ((b) << 8) | (a))
/* Two 16-bit values -> 32 bits: a in bits 15..0, b in bits 31..16. */
199 # define PACK_2U16(a,b) (((b) << 16) | (a))
/* Signed packing helpers: every argument is first masked to its low 8 bits
 * (& 255) or low 16 bits (& 0xffff), which strips the upper bits a negative
 * value would otherwise carry into neighbouring fields, and the masked values
 * are then handed to the corresponding unsigned PACK_* macro. */
/* Two signed 8-bit values via PACK_2U8. */
204 # define PACK_2S8(a,b) PACK_2U8((a)&255, (b)&255)
/* Four signed 8-bit values via PACK_4U8. */
207 # define PACK_4S8(a,b,c,d) PACK_4U8((a)&255, (b)&255, (c)&255, (d)&255)
/* Two signed 16-bit values via PACK_2U16. */
210 # define PACK_2S16(a,b) PACK_2U16((a)&0xffff, (b)&0xffff)
/*
 * Divide a by b without a division instruction: a is widened to 64 bits,
 * multiplied by the table entry ff_inverse[b], and the upper 32 bits of the
 * product are returned as uint32_t.
 *
 * NOTE(review): ff_inverse is declared with 257 entries, so b presumably has
 * to stay within 0..256; the table contents are not visible here - confirm
 * the exact rounding behaviour against the table definition.
 *
 * Both parameters are parenthesized so that a compound expression passed as
 * an argument is evaluated as a unit before it is cast or used as an index.
 */
# define FASTDIV(a,b) ((uint32_t)(((uint64_t)(a) * ff_inverse[(b)]) >> 32))
218 #define ff_sqrt ff_sqrt
219 static inline av_const unsigned int ff_sqrt(unsigned int a)
223 if (a < 255) return (ff_sqrt_tab[a + 1] - 1) >> 4;
224 else if (a < (1 << 12)) b = ff_sqrt_tab[a >> 4] >> 2;
226 else if (a < (1 << 14)) b = ff_sqrt_tab[a >> 6] >> 1;
227 else if (a < (1 << 16)) b = ff_sqrt_tab[a >> 8] ;
230 int s = av_log2_16bit(a >> 16) >> 1;
231 unsigned int c = a >> (s + 2);
232 b = ff_sqrt_tab[c >> (s + 8)];
233 b = FASTDIV(c,b) + (b << s);
236 return b - (a < b * b);
240 static inline av_const float ff_sqrf(float a)
245 static inline int8_t ff_u8_to_s8(uint8_t a)
255 #endif /* AVCODEC_MATHOPS_H */