From: Johannes Demel Date: Tue, 17 Mar 2020 20:20:51 +0000 (+0100) Subject: [PATCH 2/7] exp: Rename SSE4.1 to SSE2 kernel X-Git-Tag: archive/raspbian/2.2.1-2+rpi1^2~10 X-Git-Url: https://dgit.raspbian.org/?a=commitdiff_plain;h=20287c9b7d67b25bfb58de0a1654b8d95522a9ad;p=volk.git [PATCH 2/7] exp: Rename SSE4.1 to SSE2 kernel The SSE kernel only requires SSE2 instructions. Thus, we can just use this instruction level. Gbp-Pq: Name 0002-exp-Rename-SSE4.1-to-SSE2-kernel.patch --- diff --git a/kernels/volk/volk_32f_exp_32f.h b/kernels/volk/volk_32f_exp_32f.h index 19c3d9d..26fdf02 100644 --- a/kernels/volk/volk_32f_exp_32f.h +++ b/kernels/volk/volk_32f_exp_32f.h @@ -99,11 +99,11 @@ #ifndef INCLUDED_volk_32f_exp_32f_a_H #define INCLUDED_volk_32f_exp_32f_a_H -#ifdef LV_HAVE_SSE4_1 -#include <smmintrin.h> +#ifdef LV_HAVE_SSE2 +#include <emmintrin.h> static inline void -volk_32f_exp_32f_a_sse4_1(float* bVector, const float* aVector, unsigned int num_points) +volk_32f_exp_32f_a_sse2(float* bVector, const float* aVector, unsigned int num_points) { float* bPtr = bVector; const float* aPtr = aVector; @@ -175,7 +175,7 @@ volk_32f_exp_32f_a_sse4_1(float* bVector, const float* aVector, unsigned int num } } -#endif /* LV_HAVE_SSE4_1 for aligned */ +#endif /* LV_HAVE_SSE2 for aligned */ #ifdef LV_HAVE_GENERIC @@ -199,11 +199,11 @@ volk_32f_exp_32f_a_generic(float* bVector, const float* aVector, unsigned int nu #ifndef INCLUDED_volk_32f_exp_32f_u_H #define INCLUDED_volk_32f_exp_32f_u_H -#ifdef LV_HAVE_SSE4_1 -#include <smmintrin.h> +#ifdef LV_HAVE_SSE2 +#include <emmintrin.h> static inline void -volk_32f_exp_32f_u_sse4_1(float* bVector, const float* aVector, unsigned int num_points) +volk_32f_exp_32f_u_sse2(float* bVector, const float* aVector, unsigned int num_points) { float* bPtr = bVector; const float* aPtr = aVector; @@ -276,7 +276,7 @@ volk_32f_exp_32f_u_sse4_1(float* bVector, const float* aVector, unsigned int num } } -#endif /* LV_HAVE_SSE4_1 for unaligned */ +#endif /* LV_HAVE_SSE2 for unaligned */ #ifdef LV_HAVE_GENERIC