From 2250d3a293d36ed9d8143d4c3d3e94086c429af4 Mon Sep 17 00:00:00 2001
From: Richard Henderson
Date: Mon, 29 Aug 2016 11:46:19 -0700
Subject: [PATCH] cutils: Remove aarch64 buffer zero checking

The revised integer version is 4 times faster than the neon version
on an AppliedMicro Mustang. Even with hand scheduling and additional
unrolling I cannot make any neon version run as fast as the integer.

Signed-off-by: Richard Henderson
Signed-off-by: Paolo Bonzini
---
 util/bufferiszero.c | 15 ---------------
 1 file changed, 15 deletions(-)

diff --git a/util/bufferiszero.c b/util/bufferiszero.c
index 025cb8f..e6679b3 100644
--- a/util/bufferiszero.c
+++ b/util/bufferiszero.c
@@ -200,21 +200,6 @@ static bool select_accel_fn(const void *buf, size_t len)
     return buffer_zero_int(buf, len);
 }
 
-#elif defined(__aarch64__)
-#include "arm_neon.h"
-
-#define DO_NONZERO(X)  (vgetq_lane_u64((X), 0) | vgetq_lane_u64((X), 1))
-ACCEL_BUFFER_ZERO(buffer_zero_neon, 128, uint64x2_t, DO_NONZERO)
-
-static bool select_accel_fn(const void *buf, size_t len)
-{
-    uintptr_t ibuf = (uintptr_t)buf;
-    if (len % 128 == 0 && ibuf % sizeof(uint64x2_t) == 0) {
-        return buffer_zero_neon(buf, len);
-    }
-    return buffer_zero_int(buf, len);
-}
-
 #else
 #define select_accel_fn buffer_zero_int
 #endif
-- 
2.7.4