55 #ifndef INCLUDED_volk_32fc_conjugate_32fc_u_H
56 #define INCLUDED_volk_32fc_conjugate_32fc_u_H
64 #include <immintrin.h>
68 unsigned int num_points)
70 unsigned int number = 0;
71 const unsigned int quarterPoints = num_points / 4;
77 __m256 conjugator = _mm256_setr_ps(0, -0.f, 0, -0.f, 0, -0.f, 0, -0.f);
79 for (; number < quarterPoints; number++) {
81 x = _mm256_loadu_ps((
float*)a);
83 x = _mm256_xor_ps(x, conjugator);
85 _mm256_storeu_ps((
float*)c, x);
91 number = quarterPoints * 4;
93 for (; number < num_points; number++) {
100 #include <pmmintrin.h>
104 unsigned int num_points)
106 unsigned int number = 0;
107 const unsigned int halfPoints = num_points / 2;
115 for (; number < halfPoints; number++) {
127 if ((num_points % 2) != 0) {
133 #ifdef LV_HAVE_GENERIC
137 unsigned int num_points)
141 unsigned int number = 0;
143 for (number = 0; number < num_points; number++) {
151 #ifndef INCLUDED_volk_32fc_conjugate_32fc_a_H
152 #define INCLUDED_volk_32fc_conjugate_32fc_a_H
155 #include <inttypes.h>
160 #include <immintrin.h>
164 unsigned int num_points)
166 unsigned int number = 0;
167 const unsigned int quarterPoints = num_points / 4;
173 __m256 conjugator = _mm256_setr_ps(0, -0.f, 0, -0.f, 0, -0.f, 0, -0.f);
175 for (; number < quarterPoints; number++) {
177 x = _mm256_load_ps((
float*)a);
179 x = _mm256_xor_ps(x, conjugator);
181 _mm256_store_ps((
float*)c, x);
187 number = quarterPoints * 4;
189 for (; number < num_points; number++) {
196 #include <pmmintrin.h>
200 unsigned int num_points)
202 unsigned int number = 0;
203 const unsigned int halfPoints = num_points / 2;
211 for (; number < halfPoints; number++) {
223 if ((num_points % 2) != 0) {
230 #include <arm_neon.h>
234 unsigned int num_points)
237 const unsigned int quarterPoints = num_points / 4;
243 for (number = 0; number < quarterPoints; number++) {
245 x = vld2q_f32((
float*)a);
248 x.val[1] = vnegq_f32(x.val[1]);
250 vst2q_f32((
float*)c, x);
256 for (number = quarterPoints * 4; number < num_points; number++) {
263 #ifdef LV_HAVE_GENERIC
267 unsigned int num_points)
271 unsigned int number = 0;
273 for (number = 0; number < num_points; number++) {
FORCE_INLINE __m128 _mm_xor_ps(__m128 a, __m128 b)
Definition: sse2neon.h:2958
float32x4_t __m128
Definition: sse2neon.h:235
FORCE_INLINE __m128 _mm_setr_ps(float w, float z, float y, float x)
Definition: sse2neon.h:2523
FORCE_INLINE void _mm_storeu_ps(float *p, __m128 a)
Definition: sse2neon.h:2787
FORCE_INLINE __m128 _mm_loadu_ps(const float *p)
Definition: sse2neon.h:1941
FORCE_INLINE __m128 _mm_load_ps(const float *p)
Definition: sse2neon.h:1858
FORCE_INLINE void _mm_store_ps(float *p, __m128 a)
Definition: sse2neon.h:2704
static void volk_32fc_conjugate_32fc_a_avx(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:162
static void volk_32fc_conjugate_32fc_u_sse3(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:102
static void volk_32fc_conjugate_32fc_a_sse3(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:198
static void volk_32fc_conjugate_32fc_a_neon(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:232
static void volk_32fc_conjugate_32fc_u_avx(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:66
static void volk_32fc_conjugate_32fc_a_generic(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:265
static void volk_32fc_conjugate_32fc_generic(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:135
#define __VOLK_PREFETCH(addr)
Definition: volk_common.h:71
#define lv_conj(x)
Definition: volk_complex.h:100
float complex lv_32fc_t
Definition: volk_complex.h:74