vqtbl2_s8 (int8x16x2_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_oi __o;
- __o = __builtin_aarch64_set_qregoiv16qi (__o, __tab.val[0], 0);
- __o = __builtin_aarch64_set_qregoiv16qi (__o, __tab.val[1], 1);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return __builtin_aarch64_qtbl2v8qi (__o, (int8x8_t)__idx);
}
vqtbl2_u8 (uint8x16x2_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_oi __o;
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[1], 1);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (uint8x8_t)__builtin_aarch64_qtbl2v8qi (__o, (int8x8_t)__idx);
}
vqtbl2_p8 (poly8x16x2_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_oi __o;
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[1], 1);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (poly8x8_t)__builtin_aarch64_qtbl2v8qi (__o, (int8x8_t)__idx);
}
vqtbl2q_s8 (int8x16x2_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_oi __o;
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[1], 1);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return __builtin_aarch64_qtbl2v16qi (__o, (int8x16_t)__idx);
}
vqtbl2q_u8 (uint8x16x2_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_oi __o;
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[1], 1);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (uint8x16_t)__builtin_aarch64_qtbl2v16qi (__o, (int8x16_t)__idx);
}
vqtbl2q_p8 (poly8x16x2_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_oi __o;
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregoiv16qi (__o, (int8x16_t)__tab.val[1], 1);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (poly8x16_t)__builtin_aarch64_qtbl2v16qi (__o, (int8x16_t)__idx);
}
vqtbl3_s8 (int8x16x3_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_ci __o;
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[2], 2);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return __builtin_aarch64_qtbl3v8qi (__o, (int8x8_t)__idx);
}
vqtbl3_u8 (uint8x16x3_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_ci __o;
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[2], 2);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (uint8x8_t)__builtin_aarch64_qtbl3v8qi (__o, (int8x8_t)__idx);
}
vqtbl3_p8 (poly8x16x3_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_ci __o;
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[2], 2);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (poly8x8_t)__builtin_aarch64_qtbl3v8qi (__o, (int8x8_t)__idx);
}
vqtbl3q_s8 (int8x16x3_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_ci __o;
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[2], 2);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return __builtin_aarch64_qtbl3v16qi (__o, (int8x16_t)__idx);
}
vqtbl3q_u8 (uint8x16x3_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_ci __o;
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[2], 2);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (uint8x16_t)__builtin_aarch64_qtbl3v16qi (__o, (int8x16_t)__idx);
}
vqtbl3q_p8 (poly8x16x3_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_ci __o;
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregciv16qi (__o, (int8x16_t)__tab.val[2], 2);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (poly8x16_t)__builtin_aarch64_qtbl3v16qi (__o, (int8x16_t)__idx);
}
vqtbl4_s8 (int8x16x4_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_xi __o;
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[2], 2);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[3], 3);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return __builtin_aarch64_qtbl4v8qi (__o, (int8x8_t)__idx);
}
vqtbl4_u8 (uint8x16x4_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_xi __o;
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[2], 2);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[3], 3);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (uint8x8_t)__builtin_aarch64_qtbl4v8qi (__o, (int8x8_t)__idx);
}
vqtbl4_p8 (poly8x16x4_t __tab, uint8x8_t __idx)
{
__builtin_aarch64_simd_xi __o;
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[2], 2);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[3], 3);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (poly8x8_t)__builtin_aarch64_qtbl4v8qi (__o, (int8x8_t)__idx);
}
vqtbl4q_s8 (int8x16x4_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_xi __o;
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[2], 2);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[3], 3);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return __builtin_aarch64_qtbl4v16qi (__o, (int8x16_t)__idx);
}
vqtbl4q_u8 (uint8x16x4_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_xi __o;
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[2], 2);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[3], 3);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (uint8x16_t)__builtin_aarch64_qtbl4v16qi (__o, (int8x16_t)__idx);
}
vqtbl4q_p8 (poly8x16x4_t __tab, uint8x16_t __idx)
{
__builtin_aarch64_simd_xi __o;
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[0], 0);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[1], 1);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[2], 2);
- __o = __builtin_aarch64_set_qregxiv16qi (__o, (int8x16_t)__tab.val[3], 3);
+ __builtin_memcpy (&__o, &__tab, sizeof (__tab)); /* Copy all of __tab into __o (assumes sizes match -- confirm).  */
return (poly8x16_t)__builtin_aarch64_qtbl4v16qi (__o, (int8x16_t)__idx);
}
--- /dev/null
+/* { dg-do compile } */
+/* { dg-options "-O3" } */
+
+#include <arm_neon.h>
+/* Define test_<name>_<ts> (a, b), which simply returns <name>_<ts> (a, b).  */
+#define TEST_TBL(name, rettype, tbltype, idxtype, ts) \
+ rettype test_ ## name ## _ ## ts (tbltype a, idxtype b) \
+ { \
+ return name ## _ ## ts (a, b); \
+ }
+/* Wrappers for the s8, u8 and p8 forms of vqtbl2, vqtbl2q, vqtbl4 and vqtbl4q.  */
+TEST_TBL (vqtbl2, int8x8_t, int8x16x2_t, uint8x8_t, s8)
+TEST_TBL (vqtbl2, uint8x8_t, uint8x16x2_t, uint8x8_t, u8)
+TEST_TBL (vqtbl2, poly8x8_t, poly8x16x2_t, uint8x8_t, p8)
+
+TEST_TBL (vqtbl2q, int8x16_t, int8x16x2_t, uint8x16_t, s8)
+TEST_TBL (vqtbl2q, uint8x16_t, uint8x16x2_t, uint8x16_t, u8)
+TEST_TBL (vqtbl2q, poly8x16_t, poly8x16x2_t, uint8x16_t, p8)
+
+TEST_TBL (vqtbl4, int8x8_t, int8x16x4_t, uint8x8_t, s8)
+TEST_TBL (vqtbl4, uint8x8_t, uint8x16x4_t, uint8x8_t, u8)
+TEST_TBL (vqtbl4, poly8x8_t, poly8x16x4_t, uint8x8_t, p8)
+
+TEST_TBL (vqtbl4q, int8x16_t, int8x16x4_t, uint8x16_t, s8)
+TEST_TBL (vqtbl4q, uint8x16_t, uint8x16x4_t, uint8x16_t, u8)
+TEST_TBL (vqtbl4q, poly8x16_t, poly8x16x4_t, uint8x16_t, p8)
+/* Define test_<name>_<ts> (a, b) taking the index first and the table second; it returns <name>_<ts> (b, a).  */
+#define TEST_TBL3(name, rettype, tbltype, idxtype, ts) \
+ rettype test_ ## name ## _ ## ts (idxtype a, tbltype b) \
+ { \
+ return name ## _ ## ts (b, a); \
+ }
+/* Wrappers for the s8, u8 and p8 forms of vqtbl3 and vqtbl3q.  */
+TEST_TBL3 (vqtbl3, int8x8_t, int8x16x3_t, uint8x8_t, s8)
+TEST_TBL3 (vqtbl3, uint8x8_t, uint8x16x3_t, uint8x8_t, u8)
+TEST_TBL3 (vqtbl3, poly8x8_t, poly8x16x3_t, uint8x8_t, p8)
+
+TEST_TBL3 (vqtbl3q, int8x16_t, int8x16x3_t, uint8x16_t, s8)
+TEST_TBL3 (vqtbl3q, uint8x16_t, uint8x16x3_t, uint8x16_t, u8)
+TEST_TBL3 (vqtbl3q, poly8x16_t, poly8x16x3_t, uint8x16_t, p8)
+/* The assembly must contain no "mov<TAB>" and exactly 18 "tbl<TAB>" matches (18 wrappers are defined above).  */
+/* { dg-final { scan-assembler-not "mov\\t" } } */
+
+/* { dg-final { scan-assembler-times "tbl\\t" 18} } */