aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorPaolo Bonzini <pbonzini@redhat.com>2016-09-13 17:04:52 +0200
committerPaolo Bonzini <pbonzini@redhat.com>2016-09-13 19:13:32 +0200
commit86444f084b23c967d556039b22a67d80a72725ca (patch)
tree4b9e7fd90f94fae7402111575c1dba62b581ca41
parentefad6682452ec85a898609c885c2721ea12585db (diff)
cutils: Add SSE4 version
Signed-off-by: Paolo Bonzini <pbonzini@redhat.com>
-rw-r--r--util/bufferiszero.c10
1 files changed, 10 insertions, 0 deletions
diff --git a/util/bufferiszero.c b/util/bufferiszero.c
index 4af3caa1b6..bafd3d159c 100644
--- a/util/bufferiszero.c
+++ b/util/bufferiszero.c
@@ -114,6 +114,13 @@ ACCEL_BUFFER_ZERO(buffer_zero_sse2, 64, __m128i, SSE2_NONZERO)
#ifdef CONFIG_AVX2_OPT
#pragma GCC push_options
+#pragma GCC target("sse4")
+#include <smmintrin.h>
+#define SSE4_NONZERO(X) !_mm_testz_si128((X), (X))
+ACCEL_BUFFER_ZERO(buffer_zero_sse4, 64, __m128i, SSE4_NONZERO)
+#pragma GCC pop_options
+
+#pragma GCC push_options
#pragma GCC target("avx2")
#include <immintrin.h>
#define AVX2_NONZERO(X) !_mm256_testz_si256((X), (X))
@@ -182,6 +189,9 @@ static bool select_accel_fn(const void *buf, size_t len)
if (len % 128 == 0 && ibuf % 32 == 0 && (cpuid_cache & CACHE_AVX2)) {
return buffer_zero_avx2(buf, len);
}
+ if (len % 64 == 0 && ibuf % 16 == 0 && (cpuid_cache & CACHE_SSE4)) {
+ return buffer_zero_sse4(buf, len);
+ }
#endif
if (len % 64 == 0 && ibuf % 16 == 0 && (cpuid_cache & CACHE_SSE2)) {
return buffer_zero_sse2(buf, len);