Compute Library: arm_compute/core/FixedPoint.inl Source File

 /*
  * Copyright (c) 2017-2018 ARM Limited.
  *
  * SPDX-License-Identifier: MIT
  *
  * Permission is hereby granted, free of charge, to any person obtaining a copy
  * of this software and associated documentation files (the "Software"), to
  * deal in the Software without restriction, including without limitation the
  * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
  * sell copies of the Software, and to permit persons to whom the Software is
  * furnished to do so, subject to the following conditions:
  *
  * The above copyright notice and this permission notice shall be included in all
  * copies or substantial portions of the Software.
  *
  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
  * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
  * SOFTWARE.
  */
 #include "arm_compute/core/Error.h"
 #include "arm_compute/core/utils/misc/Utility.h"

 #include <cmath>
 #include <limits>

 namespace arm_compute
 {
 // 8 bit fixed point scalar saturating shift left.
 //
 // Returns a * 2^shift clamped to the qint8_t range.
 // Precondition: shift >= 0 (a negative shift count is undefined behaviour).
 inline qint8_t sqshl_qs8(qint8_t a, int shift)
 {
     // Zero stays zero whatever the shift amount is
     if(a == 0)
     {
         return 0;
     }

     // From 8 bits onwards every non-zero input leaves the qint8_t range, so the
     // result is known without computing a shift that could overflow the
     // intermediate (or be undefined for counts >= 32).
     if(shift >= 8)
     {
         return (a > 0) ? std::numeric_limits<qint8_t>::max() : std::numeric_limits<qint8_t>::lowest();
     }

     // |a| * 2^shift <= 128 * 128 here, which fits in qint16_t. Multiplying
     // instead of shifting avoids left-shifting a negative value.
     const qint16_t tmp = static_cast<qint16_t>(a) * static_cast<qint16_t>(1 << shift);

     // Saturate the result in case of overflow and cast to qint8_t
     return utility::saturate_cast<qint8_t>(tmp);
 }

 // 16 bit fixed point scalar saturating shift left.
 //
 // Returns a * 2^shift clamped to the qint16_t range.
 // Precondition: shift >= 0 (a negative shift count is undefined behaviour).
 inline qint16_t sqshl_qs16(qint16_t a, int shift)
 {
     // Zero stays zero whatever the shift amount is
     if(a == 0)
     {
         return 0;
     }

     // From 16 bits onwards every non-zero input leaves the qint16_t range, so the
     // result is known without computing a shift that could overflow the
     // intermediate (or be undefined for counts >= 32).
     if(shift >= 16)
     {
         return (a > 0) ? std::numeric_limits<qint16_t>::max() : std::numeric_limits<qint16_t>::lowest();
     }

     // |a| * 2^shift <= 2^15 * 2^15 here, which fits in qint32_t. Multiplying
     // instead of shifting avoids left-shifting a negative value.
     const qint32_t tmp = static_cast<qint32_t>(a) * (static_cast<qint32_t>(1) << shift);

     // Saturate the result in case of overflow and cast to qint16_t
     return utility::saturate_cast<qint16_t>(tmp);
 }

 // 8 bit fixed point scalar shift right: adds half of the last kept bit
 // (with saturation) and then shifts right by `shift`. `shift` must not be zero.
 inline qint8_t sshr_qs8(qint8_t a, int shift)
 {
     ARM_COMPUTE_ERROR_ON_MSG(shift == 0, "Shift should not be zero");

     // Rounding term: one half of the least significant bit that survives the shift
     const qint8_t half_lsb = 1 << (shift - 1);
     const qint8_t biased   = sqadd_qs8(a, half_lsb);

     return biased >> shift;
 }

 // 16 bit fixed point scalar shift right: adds half of the last kept bit
 // (with saturation) and then shifts right by `shift`. `shift` must not be zero.
 inline qint16_t sshr_qs16(qint16_t a, int shift)
 {
     ARM_COMPUTE_ERROR_ON_MSG(shift == 0, "Shift should not be zero");

     // Rounding term: one half of the least significant bit that survives the shift
     const qint16_t half_lsb = 1 << (shift - 1);
     const qint16_t biased   = sqadd_qs16(a, half_lsb);

     return biased >> shift;
 }

 // 8 bit fixed point scalar absolute value. The most negative input has no
 // positive counterpart and maps to the largest representable value instead.
 inline qint8_t sabs_qs8(qint8_t a)
 {
     if(a >= 0)
     {
         return a;
     }

     if(a == std::numeric_limits<int8_t>::min())
     {
         return std::numeric_limits<int8_t>::max();
     }

     return -a;
 }

 // 16 bit fixed point scalar absolute value. The most negative input has no
 // positive counterpart and maps to the largest representable value instead.
 inline qint16_t sabs_qs16(qint16_t a)
 {
     if(a >= 0)
     {
         return a;
     }

     if(a == std::numeric_limits<int16_t>::min())
     {
         return std::numeric_limits<int16_t>::max();
     }

     return -a;
 }

 // 8 bit fixed point scalar add. No saturation: the sum is simply narrowed
 // back to qint8_t.
 inline qint8_t sadd_qs8(qint8_t a, qint8_t b)
 {
     const int wide_sum = a + b;
     return static_cast<qint8_t>(wide_sum);
 }

 // 16 bit fixed point scalar add. No saturation: the sum is simply narrowed
 // back to qint16_t.
 inline qint16_t sadd_qs16(qint16_t a, qint16_t b)
 {
     const int wide_sum = a + b;
     return static_cast<qint16_t>(wide_sum);
 }

 // 8 bit fixed point scalar saturating add.
 inline qint8_t sqadd_qs8(qint8_t a, qint8_t b)
 {
     // Widen both operands to qint16_t so the exact sum is available for the overflow check
     const qint16_t wide_a   = a;
     const qint16_t wide_b   = b;
     const qint16_t wide_sum = wide_a + wide_b;

     // Clamp to the qint8_t range while narrowing
     return utility::saturate_cast<qint8_t>(wide_sum);
 }

 // 16 bit fixed point scalar saturating add.
 inline qint16_t sqadd_qs16(qint16_t a, qint16_t b)
 {
     // Widen both operands to qint32_t so the exact sum is available for the overflow check
     const qint32_t wide_a   = a;
     const qint32_t wide_b   = b;
     const qint32_t wide_sum = wide_a + wide_b;

     // Clamp to the qint16_t range while narrowing
     return utility::saturate_cast<qint16_t>(wide_sum);
 }

 // 32 bit fixed point scalar saturating add.
 inline qint32_t sqadd_qs32(qint32_t a, qint32_t b)
 {
     // Widen both operands to qint64_t so the exact sum is available for the overflow check
     const qint64_t wide_a   = a;
     const qint64_t wide_b   = b;
     const qint64_t wide_sum = wide_a + wide_b;

     // Clamp to the qint32_t range while narrowing
     return utility::saturate_cast<qint32_t>(wide_sum);
 }

 // 8 bit fixed point scalar subtraction. No saturation: the difference is
 // simply narrowed back to qint8_t.
 inline qint8_t ssub_qs8(qint8_t a, qint8_t b)
 {
     const int wide_diff = a - b;
     return static_cast<qint8_t>(wide_diff);
 }

 // 16 bit fixed point scalar subtraction. No saturation: the difference is
 // simply narrowed back to qint16_t.
 inline qint16_t ssub_qs16(qint16_t a, qint16_t b)
 {
     const int wide_diff = a - b;
     return static_cast<qint16_t>(wide_diff);
 }

 // 8 bit fixed point scalar saturating subtraction.
 inline qint8_t sqsub_qs8(qint8_t a, qint8_t b)
 {
     // Widen both operands to qint16_t so the exact difference is available for the overflow check
     const qint16_t wide_a    = a;
     const qint16_t wide_b    = b;
     const qint16_t wide_diff = wide_a - wide_b;

     // Clamp to the qint8_t range while narrowing
     return utility::saturate_cast<qint8_t>(wide_diff);
 }

 // 16 bit fixed point scalar saturating subtraction.
 inline qint16_t sqsub_qs16(qint16_t a, qint16_t b)
 {
     // Widen both operands to qint32_t so the exact difference is available for the overflow check
     const qint32_t wide_a    = a;
     const qint32_t wide_b    = b;
     const qint32_t wide_diff = wide_a - wide_b;

     // Clamp to the qint16_t range while narrowing
     return utility::saturate_cast<qint16_t>(wide_diff);
 }

 // 8 bit fixed point scalar multiply (non-saturating): the rounded product is
 // rescaled by fixed_point_position and narrowed to qint8_t without clamping.
 inline qint8_t smul_qs8(qint8_t a, qint8_t b, int fixed_point_position)
 {
     // Half of the last bit kept after the rescaling shift
     const qint16_t half_ulp = (1 << (fixed_point_position - 1));

     // Double-width product, then add the rounding term
     const qint16_t product = static_cast<qint16_t>(a) * static_cast<qint16_t>(b);
     const qint16_t rounded = product + half_ulp;

     return static_cast<qint8_t>(rounded >> fixed_point_position);
 }

 // 16 bit fixed point scalar multiply (non-saturating): the rounded product is
 // rescaled by fixed_point_position and narrowed to qint16_t without clamping.
 inline qint16_t smul_qs16(qint16_t a, qint16_t b, int fixed_point_position)
 {
     // Half of the last bit kept after the rescaling shift
     const qint32_t half_ulp = (1 << (fixed_point_position - 1));

     // Double-width product, then add the rounding term
     const qint32_t product = static_cast<qint32_t>(a) * static_cast<qint32_t>(b);
     const qint32_t rounded = product + half_ulp;

     return static_cast<qint16_t>(rounded >> fixed_point_position);
 }

 // 8 bit fixed point scalar saturating multiply: the rounded product is
 // rescaled by fixed_point_position and clamped to the qint8_t range.
 inline qint8_t sqmul_qs8(qint8_t a, qint8_t b, int fixed_point_position)
 {
     // Half of the last bit kept after the rescaling shift
     const qint16_t half_ulp = (1 << (fixed_point_position - 1));

     // Double-width product, then add the rounding term
     const qint16_t product = static_cast<qint16_t>(a) * static_cast<qint16_t>(b);
     const qint16_t rounded = product + half_ulp;

     return utility::saturate_cast<qint8_t>(rounded >> fixed_point_position);
 }

 // 16 bit fixed point scalar saturating multiply: the rounded product is
 // rescaled by fixed_point_position and clamped to the qint16_t range.
 inline qint16_t sqmul_qs16(qint16_t a, qint16_t b, int fixed_point_position)
 {
     // Half of the last bit kept after the rescaling shift
     const qint32_t half_ulp = (1 << (fixed_point_position - 1));

     // Double-width product, then add the rounding term
     const qint32_t product = static_cast<qint32_t>(a) * static_cast<qint32_t>(b);
     const qint32_t rounded = product + half_ulp;

     return utility::saturate_cast<qint16_t>(rounded >> fixed_point_position);
 }

 // 8 bit fixed point scalar multiply long: the rounded product is rescaled by
 // fixed_point_position and returned in the wider qint16_t type.
 inline qint16_t sqmull_qs8(qint8_t a, qint8_t b, int fixed_point_position)
 {
     // Half of the last bit kept after the rescaling shift
     const qint16_t half_ulp = (1 << (fixed_point_position - 1));

     // Double-width product, then add the rounding term
     const qint16_t product = static_cast<qint16_t>(a) * static_cast<qint16_t>(b);
     const qint16_t rounded = product + half_ulp;

     return rounded >> fixed_point_position;
 }

 // 16 bit fixed point scalar multiply long: the rounded product is rescaled by
 // fixed_point_position and returned in the wider qint32_t type.
 inline qint32_t sqmull_qs16(qint16_t a, qint16_t b, int fixed_point_position)
 {
     // Half of the last bit kept after the rescaling shift
     const qint32_t half_ulp = (1 << (fixed_point_position - 1));

     // Double-width product, then add the rounding term
     const qint32_t product = static_cast<qint32_t>(a) * static_cast<qint32_t>(b);
     const qint32_t rounded = product + half_ulp;

     return rounded >> fixed_point_position;
 }

 // 8 bit fixed point scalar inverse square root, computed by normalising the
 // input, running three refinement steps x = x * (3 - a * x^2) / 2 and then
 // undoing half of the normalisation shift.
 //
 // NOTE(review): there is no guard for a <= 0. __builtin_clz(0) has an undefined
 // result and a negative `a` is sign-extended before the leading-zero count -
 // confirm that callers only pass strictly positive values.
 inline qint8_t sinvsqrt_qs8(qint8_t a, int fixed_point_position)
 {
     // __builtin_clz counts over a 32 bit int, so "- 24" converts it to leading zeros
     // within 8 bits; shift is then (bit length of a) - fixed_point_position.
     const qint8_t shift = 8 - (fixed_point_position + (__builtin_clz(a) - 24));

     const qint8_t const_three = (3 << fixed_point_position);
     // Normalise the input so that its highest set bit sits just below the binary point
     qint8_t       temp        = shift < 0 ? (a << -shift) : (a >> shift);
     // The normalised input is also used as the initial estimate
     qint8_t       x2          = temp;

     // We need three iterations to find the result
     for(int i = 0; i < 3; ++i)
     {
         // 3 - temp * x2^2, every product rescaled with the non-saturating multiply
         qint8_t three_minus_dx = ssub_qs8(const_three, smul_qs8(temp, smul_qs8(x2, x2, fixed_point_position), fixed_point_position));
         // x2 = x2 * (3 - temp * x2^2) / 2
         x2                     = (smul_qs8(x2, three_minus_dx, fixed_point_position) >> 1);
     }

     // Undo the normalisation: the input was scaled by 2^shift, so the result is
     // rescaled by half that shift (integer halving of the shift amount)
     temp = shift < 0 ? (x2 << (-shift >> 1)) : (x2 >> (shift >> 1));

     return temp;
 }

 // 16 bit fixed point scalar inverse square root, computed by normalising the
 // input, running three refinement steps x = x * (3 - a * x^2) / 2 and then
 // undoing half of the normalisation shift.
 //
 // NOTE(review): there is no guard for a <= 0. __builtin_clz(0) has an undefined
 // result and a negative `a` is sign-extended before the leading-zero count -
 // confirm that callers only pass strictly positive values.
 inline qint16_t sinvsqrt_qs16(qint16_t a, int fixed_point_position)
 {
     // __builtin_clz counts over a 32 bit int, so "- 16" converts it to leading zeros
     // within 16 bits; shift is then (bit length of a) - fixed_point_position.
     const qint16_t shift = 16 - (fixed_point_position + (__builtin_clz(a) - 16));

     const qint16_t const_three = (3 << fixed_point_position);
     // Normalise the input so that its highest set bit sits just below the binary point
     qint16_t       temp        = shift < 0 ? (a << -shift) : (a >> shift);
     // The normalised input is also used as the initial estimate
     qint16_t       x2          = temp;

     // We need three iterations to find the result
     for(int i = 0; i < 3; ++i)
     {
         // 3 - temp * x2^2, every product rescaled with the non-saturating multiply
         qint16_t three_minus_dx = ssub_qs16(const_three, smul_qs16(temp, smul_qs16(x2, x2, fixed_point_position), fixed_point_position));
         // x2 = x2 * (3 - temp * x2^2) / 2
         x2                      = smul_qs16(x2, three_minus_dx, fixed_point_position) >> 1;
     }

     // Undo the normalisation: the input was scaled by 2^shift, so the result is
     // rescaled by half that shift (integer halving of the shift amount)
     temp = shift < 0 ? (x2 << ((-shift) >> 1)) : (x2 >> (shift >> 1));

     return temp;
 }

 // 8 bit fixed point scalar division (non-saturating). The numerator is
 // pre-scaled by 2^fixed_point_position so the quotient keeps the same format.
 inline qint8_t sdiv_qs8(qint8_t a, qint8_t b, int fixed_point_position)
 {
     const qint16_t scaled_numerator = a << fixed_point_position;
     const int      quotient         = scaled_numerator / b;

     return static_cast<qint8_t>(quotient);
 }

 // 16 bit fixed point scalar division (non-saturating). The numerator is
 // pre-scaled by 2^fixed_point_position so the quotient keeps the same format.
 inline qint16_t sdiv_qs16(qint16_t a, qint16_t b, int fixed_point_position)
 {
     const qint32_t scaled_numerator = a << fixed_point_position;
     const qint32_t quotient         = scaled_numerator / b;

     return static_cast<qint16_t>(quotient);
 }

 // 8 bit fixed point scalar saturating exponential.
 //
 // The input is split as a = dec_a * ln(2) + remainder. A degree-4 polynomial is
 // evaluated on the absolute value of the remainder and the result is scaled by
 // 2^dec_a with a final shift (right for negative dec_a, saturating left otherwise).
 inline qint8_t sqexp_qs8(qint8_t a, int fixed_point_position)
 {
     // Constants, each rounded from a higher precision literal to the requested fixed point position
     const qint8_t const_one = (1 << fixed_point_position);
     const qint8_t ln2       = ((0x58 >> (6 - fixed_point_position)) + 1) >> 1;
     const qint8_t inv_ln2   = (((0x38 >> (6 - fixed_point_position)) + 1) >> 1) | const_one;
     const qint8_t A         = ((0x7F >> (6 - fixed_point_position)) + 1) >> 1;
     const qint8_t B         = ((0x3F >> (6 - fixed_point_position)) + 1) >> 1;
     const qint8_t C         = ((0x16 >> (6 - fixed_point_position)) + 1) >> 1;
     const qint8_t D         = ((0x05 >> (6 - fixed_point_position)) + 1) >> 1;

     // Polynomial expansion
     const int     dec_a = (sqmul_qs8(a, inv_ln2, fixed_point_position) >> fixed_point_position);
     const qint8_t alpha = sabs_qs8(sqsub_qs8(a, sqmul_qs8(ln2, sqshl_qs8(dec_a, fixed_point_position), fixed_point_position)));
     qint8_t       sum   = sqadd_qs8(sqmul_qs8(alpha, D, fixed_point_position), C);
     sum                 = sqadd_qs8(sqmul_qs8(alpha, sum, fixed_point_position), B);
     sum                 = sqadd_qs8(sqmul_qs8(alpha, sum, fixed_point_position), A);
     sum                 = sqmul_qs8(alpha, sum, fixed_point_position);
     sum                 = sqadd_qs8(sum, const_one);

     if(dec_a < 0)
     {
         // Shifting an 8 bit value right by 7 already leaves only its sign, so larger
         // counts are clamped; this keeps the shift defined when -dec_a reaches 32 or more.
         const int right_shift = (dec_a < -7) ? 7 : -dec_a;
         return sum >> right_shift;
     }

     // A left shift by 8 already saturates every non-zero 8 bit value; clamping keeps
     // the shifted value inside the intermediate type used by sqshl_qs8.
     const int left_shift = (dec_a > 8) ? 8 : dec_a;
     return sqshl_qs8(sum, left_shift);
 }

 // 16 bit fixed point scalar saturating exponential.
 //
 // The input is split as a = dec_a * ln(2) + remainder. A degree-4 polynomial is
 // evaluated on the absolute value of the remainder and the result is scaled by
 // 2^dec_a with a final shift (right for negative dec_a, saturating left otherwise).
 inline qint16_t sqexp_qs16(qint16_t a, int fixed_point_position)
 {
     // Constants, each rounded from a higher precision literal to the requested fixed point position
     const qint16_t const_one = (1 << fixed_point_position);
     const qint16_t ln2       = ((0x58B9 >> (14 - fixed_point_position)) + 1) >> 1;
     const qint16_t inv_ln2   = (((0x38AA >> (14 - fixed_point_position)) + 1) >> 1) | const_one;
     const qint16_t A         = ((0x7FBA >> (14 - fixed_point_position)) + 1) >> 1;
     const qint16_t B         = ((0x3FE9 >> (14 - fixed_point_position)) + 1) >> 1;
     const qint16_t C         = ((0x1693 >> (14 - fixed_point_position)) + 1) >> 1;
     const qint16_t D         = ((0x0592 >> (14 - fixed_point_position)) + 1) >> 1;

     // Polynomial expansion
     const int      dec_a = (sqmul_qs16(a, inv_ln2, fixed_point_position) >> fixed_point_position);
     const qint16_t alpha = sabs_qs16(sqsub_qs16(a, sqmul_qs16(ln2, sqshl_qs16(dec_a, fixed_point_position), fixed_point_position)));
     qint16_t       sum   = sqadd_qs16(sqmul_qs16(alpha, D, fixed_point_position), C);
     sum                  = sqadd_qs16(sqmul_qs16(alpha, sum, fixed_point_position), B);
     sum                  = sqadd_qs16(sqmul_qs16(alpha, sum, fixed_point_position), A);
     sum                  = sqmul_qs16(alpha, sum, fixed_point_position);
     sum                  = sqadd_qs16(sum, const_one);

     if(dec_a < 0)
     {
         // Shifting a 16 bit value right by 15 already leaves only its sign, so larger
         // counts are clamped; this keeps the shift defined when -dec_a reaches 32 or more.
         const int right_shift = (dec_a < -15) ? 15 : -dec_a;
         return sum >> right_shift;
     }

     // A left shift by 16 already saturates every non-zero 16 bit value; clamping keeps
     // the shifted value inside the intermediate type used by sqshl_qs16.
     const int left_shift = (dec_a > 16) ? 16 : dec_a;
     return sqshl_qs16(sum, left_shift);
 }

 // 8 bit fixed point scalar logarithm.
 //
 // Returns 0 for a == 1.0 and for inputs outside the domain (a <= 0). Inputs
 // below 1.0 are handled as -log(1 / a). Otherwise the integer power of two is
 // removed, a degree-4 polynomial is evaluated on the remaining fraction, and
 // the sum of both parts is multiplied by ln(2).
 inline qint8_t slog_qs8(qint8_t a, int fixed_point_position)
 {
     // Constants
     qint8_t const_one = (1 << fixed_point_position);
     qint8_t ln2       = (0x58 >> (7 - fixed_point_position));
     qint8_t A         = (0x5C >> (7 - fixed_point_position - 1));
     qint8_t B         = -(0x56 >> (7 - fixed_point_position));
     qint8_t C         = (0x29 >> (7 - fixed_point_position));
     qint8_t D         = -(0x0A >> (7 - fixed_point_position));

     // Zero is rejected together with negative values: it would otherwise reach the
     // reciprocal below and divide by zero. It can also arrive through the recursion
     // when the reciprocal of a small input truncates to 0.
     if((const_one == a) || (a <= 0))
     {
         return 0;
     }
     else if(a < const_one)
     {
         return -slog_qs8(sdiv_qs8(const_one, a, fixed_point_position), fixed_point_position);
     }

     // Remove even powers of 2
     qint8_t shift_val = 31 - __builtin_clz(a >> fixed_point_position);
     a >>= shift_val;
     a = ssub_qs8(a, const_one);

     // Polynomial expansion
     qint8_t sum = sqadd_qs8(sqmul_qs8(a, D, fixed_point_position), C);
     sum         = sqadd_qs8(sqmul_qs8(a, sum, fixed_point_position), B);
     sum         = sqadd_qs8(sqmul_qs8(a, sum, fixed_point_position), A);
     sum         = sqmul_qs8(a, sum, fixed_point_position);

     // Add the removed power of two back and scale by ln(2)
     return smul_qs8(sadd_qs8(sum, shift_val << fixed_point_position), ln2, fixed_point_position);
 }

 // 16 bit fixed point scalar logarithm.
 //
 // Returns 0 for a == 1.0 and for inputs outside the domain (a <= 0). Inputs
 // below 1.0 are handled as -log(1 / a). Otherwise the integer power of two is
 // removed, a degree-4 polynomial is evaluated on the remaining fraction, and
 // the sum of both parts is multiplied by ln(2).
 inline qint16_t slog_qs16(qint16_t a, int fixed_point_position)
 {
     // Constants. The literals are 16 bit values with 15 fractional bits (14 for A),
     // so they are brought to the requested position with shifts relative to 15.
     qint16_t const_one = (1 << fixed_point_position);
     qint16_t ln2       = (0x58B9 >> (15 - fixed_point_position));
     qint16_t A         = (0x5C0F >> (15 - fixed_point_position - 1));
     qint16_t B         = -(0x56AE >> (15 - fixed_point_position));
     qint16_t C         = (0x2933 >> (15 - fixed_point_position));
     qint16_t D         = -(0x0AA7 >> (15 - fixed_point_position));

     // Zero is rejected together with negative values: it would otherwise reach the
     // reciprocal below and divide by zero. It can also arrive through the recursion
     // when the reciprocal of a small input truncates to 0.
     if((const_one == a) || (a <= 0))
     {
         return 0;
     }
     else if(a < const_one)
     {
         return -slog_qs16(sdiv_qs16(const_one, a, fixed_point_position), fixed_point_position);
     }

     // Remove even powers of 2
     qint16_t shift_val = 31 - __builtin_clz(a >> fixed_point_position);
     a >>= shift_val;
     a = ssub_qs16(a, const_one);

     // Polynomial expansion
     qint16_t sum = sqadd_qs16(sqmul_qs16(a, D, fixed_point_position), C);
     sum          = sqadd_qs16(sqmul_qs16(a, sum, fixed_point_position), B);
     sum          = sqadd_qs16(sqmul_qs16(a, sum, fixed_point_position), A);
     sum          = sqmul_qs16(a, sum, fixed_point_position);

     // Add the removed power of two back and scale by ln(2)
     return smul_qs16(sadd_qs16(sum, shift_val << fixed_point_position), ln2, fixed_point_position);
 }

 // Convert an 8 bit fixed point value to float by dividing by 2^fixed_point_position.
 inline float scvt_f32_qs8(qint8_t a, int fixed_point_position)
 {
     const int scale = 1 << fixed_point_position;
     return static_cast<float>(a) / scale;
 }

 // Convert a float to 8 bit fixed point: scale by 2^fixed_point_position, round
 // to the nearest integer (halves away from zero) and saturate.
 inline qint8_t sqcvt_qs8_f32(float a, int fixed_point_position)
 {
     // Adding half a unit with the sign of the input makes the truncating cast round to nearest
     const double rounding_offset = (a >= 0) ? 0.5 : -0.5;

     return utility::saturate_cast<qint8_t>(a * (1 << fixed_point_position) + rounding_offset);
 }

 // Convert a 16 bit fixed point value to float by dividing by 2^fixed_point_position.
 inline float scvt_f32_qs16(qint16_t a, int fixed_point_position)
 {
     const int scale = 1 << fixed_point_position;
     return static_cast<float>(a) / scale;
 }

 // Convert a float to 16 bit fixed point: scale by 2^fixed_point_position, round
 // to the nearest integer (halves away from zero) and saturate.
 inline qint16_t sqcvt_qs16_f32(float a, int fixed_point_position)
 {
     // Adding half a unit with the sign of the input makes the truncating cast round to nearest
     const double rounding_offset = (a >= 0) ? 0.5 : -0.5;

     return utility::saturate_cast<qint16_t>(a * (1 << fixed_point_position) + rounding_offset);
 }

 // Scalar saturating move and narrow: qint16_t to qint8_t.
 inline qint8_t sqmovn_qs16(qint16_t a)
 {
     // Values outside the qint8_t range are clamped to its limits
     const qint8_t narrowed = utility::saturate_cast<qint8_t>(a);
     return narrowed;
 }

 // Scalar saturating move and narrow: qint32_t to qint16_t.
 inline qint16_t sqmovn_qs32(qint32_t a)
 {
     // Values outside the qint16_t range are clamped to its limits
     const qint16_t narrowed = utility::saturate_cast<qint16_t>(a);
     return narrowed;
 }
 }
arm_compute::Channel::A
Alpha channel.

arm_compute::test::fixed_point_arithmetic::detail::min
fixed_point< T > min(fixed_point< T > x, fixed_point< T > y)
Definition: FixedPoint.h:897

arm_compute::qint64_t
int64_t qint64_t
64 bit fixed point scalar value
Definition: FixedPoint.h:32

arm_compute::sabs_qs16
qint16_t sabs_qs16(qint16_t a)
16 bit fixed point scalar absolute value
Definition: FixedPoint.inl:67

arm_compute::smul_qs8
qint8_t smul_qs8(qint8_t a, qint8_t b, int fixed_point_position)
8 bit fixed point scalar multiply
Definition: FixedPoint.inl:137

arm_compute::ssub_qs8
qint8_t ssub_qs8(qint8_t a, qint8_t b)
8 bit fixed point scalar subtraction
Definition: FixedPoint.inl:109

arm_compute::scvt_f32_qs16
float scvt_f32_qs16(qint16_t a, int fixed_point_position)
Convert a 16 bit fixed point to float.
Definition: FixedPoint.inl:384

arm_compute::test::validation::a
CLTensor a
Definition: GEMM.cpp:121

arm_compute::sdiv_qs16
qint16_t sdiv_qs16(qint16_t a, qint16_t b, int fixed_point_position)
16 bit fixed point scalar division
Definition: FixedPoint.inl:255

arm_compute::Channel::B
Blue channel.

arm_compute::scvt_f32_qs8
float scvt_f32_qs8(qint8_t a, int fixed_point_position)
Convert an 8 bit fixed point to float.
Definition: FixedPoint.inl:373

sum
DATA_TYPE sum(__global const DATA_TYPE *input)
Calculate sum of a vector.
Definition: reduction_operation.cl:52

arm_compute::sqexp_qs16
qint16_t sqexp_qs16(qint16_t a, int fixed_point_position)
16 bit fixed point scalar exponential
Definition: FixedPoint.inl:284

arm_compute::utility::saturate_cast
T saturate_cast(U val)
Type cast with saturation.
Definition: Utility.h:140

arm_compute::sqadd_qs32
qint32_t sqadd_qs32(qint32_t a, qint32_t b)
32 bit fixed point scalar saturating add
Definition: FixedPoint.inl:100

arm_compute::sqshl_qs16
qint16_t sqshl_qs16(qint16_t a, int shift)
16 bit fixed point scalar saturating shift left
Definition: FixedPoint.inl:40

arm_compute
This file contains all available output stages for GEMMLowp on OpenCL.
Definition: 00_introduction.dox:1

arm_compute::sqmovn_qs32
qint16_t sqmovn_qs32(qint32_t a)
Scalar saturating move and narrow.
Definition: FixedPoint.inl:401

arm_compute::slog_qs16
qint16_t slog_qs16(qint16_t a, int fixed_point_position)
16 bit fixed point scalar logarithm
Definition: FixedPoint.inl:340

arm_compute::sqmull_qs16
qint32_t sqmull_qs16(qint16_t a, qint16_t b, int fixed_point_position)
16 bit fixed point scalar multiply long
Definition: FixedPoint.inl:197

arm_compute::sadd_qs8
qint8_t sadd_qs8(qint8_t a, qint8_t b)
8 bit fixed point scalar add
Definition: FixedPoint.inl:72

arm_compute::sdiv_qs8
qint8_t sdiv_qs8(qint8_t a, qint8_t b, int fixed_point_position)
8 bit fixed point scalar division
Definition: FixedPoint.inl:249

arm_compute::smul_qs16
qint16_t smul_qs16(qint16_t a, qint16_t b, int fixed_point_position)
16 bit fixed point scalar multiply
Definition: FixedPoint.inl:149

arm_compute::sqshl_qs8
qint8_t sqshl_qs8(qint8_t a, int shift)
8 bit fixed point scalar saturating shift left
Definition: FixedPoint.inl:32

arm_compute::qint32_t
int32_t qint32_t
32 bit fixed point scalar value
Definition: FixedPoint.h:31

arm_compute::qint16_t
int16_t qint16_t
16 bit fixed point scalar value
Definition: FixedPoint.h:30

arm_compute::sqcvt_qs16_f32
qint16_t sqcvt_qs16_f32(float a, int fixed_point_position)
Convert a float to 16 bit fixed point.
Definition: FixedPoint.inl:389

Error.h

arm_compute::sqadd_qs16
qint16_t sqadd_qs16(qint16_t a, qint16_t b)
16 bit fixed point scalar saturating add
Definition: FixedPoint.inl:91

arm_compute::sqsub_qs8
qint8_t sqsub_qs8(qint8_t a, qint8_t b)
8 bit fixed point scalar saturating subtraction
Definition: FixedPoint.inl:119

arm_compute::sinvsqrt_qs16
qint16_t sinvsqrt_qs16(qint16_t a, int fixed_point_position)
16 bit fixed point scalar inverse square root
Definition: FixedPoint.inl:229

arm_compute::sqmull_qs8
qint16_t sqmull_qs8(qint8_t a, qint8_t b, int fixed_point_position)
8 bit fixed point scalar multiply long
Definition: FixedPoint.inl:185

arm_compute::sqmovn_qs16
qint8_t sqmovn_qs16(qint16_t a)
Scalar saturating move and narrow.
Definition: FixedPoint.inl:395

arm_compute::sqmul_qs8
qint8_t sqmul_qs8(qint8_t a, qint8_t b, int fixed_point_position)
8 bit fixed point scalar saturating multiply
Definition: FixedPoint.inl:161

arm_compute::slog_qs8
qint8_t slog_qs8(qint8_t a, int fixed_point_position)
8 bit fixed point scalar logarithm
Definition: FixedPoint.inl:307

arm_compute::sqexp_qs8
qint8_t sqexp_qs8(qint8_t a, int fixed_point_position)
8 bit fixed point scalar exponential
Definition: FixedPoint.inl:261

arm_compute::qint8_t
int8_t qint8_t
8 bit fixed point scalar value
Definition: FixedPoint.h:29

arm_compute::ssub_qs16
qint16_t ssub_qs16(qint16_t a, qint16_t b)
16 bit fixed point scalar subtraction
Definition: FixedPoint.inl:114

arm_compute::sshr_qs8
qint8_t sshr_qs8(qint8_t a, int shift)
8 bit fixed point scalar shift right
Definition: FixedPoint.inl:48

arm_compute::sshr_qs16
qint16_t sshr_qs16(qint16_t a, int shift)
16 bit fixed point scalar shift right
Definition: FixedPoint.inl:55

arm_compute::sinvsqrt_qs8
qint8_t sinvsqrt_qs8(qint8_t a, int fixed_point_position)
8 bit fixed point scalar inverse square root
Definition: FixedPoint.inl:209

arm_compute::sqsub_qs16
qint16_t sqsub_qs16(qint16_t a, qint16_t b)
16 bit fixed point scalar saturating subtraction
Definition: FixedPoint.inl:128

arm_compute::test::fixed_point_arithmetic::detail::max
fixed_point< T > max(fixed_point< T > x, fixed_point< T > y)
Definition: FixedPoint.h:902

arm_compute::test::validation::alpha
alpha
Definition: GEMM.cpp:115

arm_compute::sabs_qs8
qint8_t sabs_qs8(qint8_t a)
8 bit fixed point scalar absolute value
Definition: FixedPoint.inl:62

arm_compute::sadd_qs16
qint16_t sadd_qs16(qint16_t a, qint16_t b)
16 bit fixed point scalar add
Definition: FixedPoint.inl:77

arm_compute::test::validation::b
CLTensor b
Definition: GEMM.cpp:122

Utility.h

arm_compute::sqcvt_qs8_f32
qint8_t sqcvt_qs8_f32(float a, int fixed_point_position)
Convert a float to 8 bit fixed point.
Definition: FixedPoint.inl:378

arm_compute::sqadd_qs8
qint8_t sqadd_qs8(qint8_t a, qint8_t b)
8 bit fixed point scalar saturating add
Definition: FixedPoint.inl:82

ARM_COMPUTE_ERROR_ON_MSG
#define ARM_COMPUTE_ERROR_ON_MSG(cond,...)
Definition: Error.h:319

arm_compute::sqmul_qs16
qint16_t sqmul_qs16(qint16_t a, qint16_t b, int fixed_point_position)
16 bit fixed point scalar saturating multiply
Definition: FixedPoint.inl:173