#include <arm_neon.h>
-#if !defined(__ARMCC_VERSION) && !defined(FORCE_NO_NEON_INLINE_ASM)
-// [both armcc & gcc set __GNUC__]
-// Use GNU style inline asm on gcc, for best performance
-// Use intrinsics on armcc
-// This switch determines if any GNU style inline asm is allowed
-#define USE_NEON_INLINE_ASM
-#endif
-
-
static force_inline uint8x8x4_t unpack0565(uint16x8_t rgb)
{
uint16x8_t gb, b;
uint8_t *keep_dst;
-#ifndef USE_NEON_INLINE_ASM
+#ifndef USE_GCC_INLINE_ASM
uint8x8_t sval,dval,temp;
sval = vld1_u8((void*)src);
uint32_t *keep_dst;
-#ifndef USE_NEON_INLINE_ASM
+#ifndef USE_GCC_INLINE_ASM
uint8x8x4_t sval,dval,temp;
sval = vld4_u8((void*)src);
do {
while (w>=8)
{
-#ifndef USE_NEON_INLINE_ASM
+#ifndef USE_GCC_INLINE_ASM
vst1q_u16(dst, pack0565(vld4_u8((void*)src)));
#else
asm volatile (
uint32_t *keep_dst;
-#ifndef USE_NEON_INLINE_ASM
+#ifndef USE_GCC_INLINE_ASM
uint8x8x4_t sval,dval,temp;
sval = vld4_u8((void*)src);
maskLine += maskStride;
w = width;
-#ifndef USE_NEON_INLINE_ASM
+#ifndef USE_GCC_INLINE_ASM
uint8x8_t alpha;
uint16x8_t dval, temp;
uint8x8x4_t sval8temp;
w = width;
-#ifndef USE_NEON_INLINE_ASM
+#ifndef USE_GCC_INLINE_ASM
uint8x8_t alpha;
uint16x8_t dval, temp;
uint8x8x4_t sval8temp;
maskLine += maskStride;
w = width;
-#ifndef USE_NEON_INLINE_ASM
+#ifndef USE_GCC_INLINE_ASM
uint8x8_t alpha;
uint8x8x4_t dval, temp;