55#ifndef INCLUDED_volk_32fc_conjugate_32fc_u_H
56#define INCLUDED_volk_32fc_conjugate_32fc_u_H
68 unsigned int num_points)
70 unsigned int number = 0;
71 const unsigned int quarterPoints = num_points / 4;
77 __m256 conjugator = _mm256_setr_ps(0, -0.f, 0, -0.f, 0, -0.f, 0, -0.f);
79 for (; number < quarterPoints; number++) {
81 x = _mm256_loadu_ps((
float*)a);
83 x = _mm256_xor_ps(x, conjugator);
85 _mm256_storeu_ps((
float*)c, x);
91 number = quarterPoints * 4;
93 for (; number < num_points; number++) {
100#include <pmmintrin.h>
104 unsigned int num_points)
106 unsigned int number = 0;
107 const unsigned int halfPoints = num_points / 2;
113 __m128 conjugator = _mm_setr_ps(0, -0.f, 0, -0.f);
115 for (; number < halfPoints; number++) {
117 x = _mm_loadu_ps((
float*)a);
119 x = _mm_xor_ps(x, conjugator);
121 _mm_storeu_ps((
float*)c, x);
127 if ((num_points % 2) != 0) {
133#ifdef LV_HAVE_GENERIC
137 unsigned int num_points)
141 unsigned int number = 0;
143 for (number = 0; number < num_points; number++) {
151#ifndef INCLUDED_volk_32fc_conjugate_32fc_a_H
152#define INCLUDED_volk_32fc_conjugate_32fc_a_H
160#include <immintrin.h>
164 unsigned int num_points)
166 unsigned int number = 0;
167 const unsigned int quarterPoints = num_points / 4;
173 __m256 conjugator = _mm256_setr_ps(0, -0.f, 0, -0.f, 0, -0.f, 0, -0.f);
175 for (; number < quarterPoints; number++) {
177 x = _mm256_load_ps((
float*)a);
179 x = _mm256_xor_ps(x, conjugator);
181 _mm256_store_ps((
float*)c, x);
187 number = quarterPoints * 4;
189 for (; number < num_points; number++) {
196#include <pmmintrin.h>
200 unsigned int num_points)
202 unsigned int number = 0;
203 const unsigned int halfPoints = num_points / 2;
209 __m128 conjugator = _mm_setr_ps(0, -0.f, 0, -0.f);
211 for (; number < halfPoints; number++) {
213 x = _mm_load_ps((
float*)a);
215 x = _mm_xor_ps(x, conjugator);
217 _mm_store_ps((
float*)c, x);
223 if ((num_points % 2) != 0) {
234 unsigned int num_points)
237 const unsigned int quarterPoints = num_points / 4;
243 for (number = 0; number < quarterPoints; number++) {
245 x = vld2q_f32((
float*)a);
248 x.val[1] = vnegq_f32(x.val[1]);
250 vst2q_f32((
float*)c, x);
256 for (number = quarterPoints * 4; number < num_points; number++) {
static void volk_32fc_conjugate_32fc_a_avx(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:162
static void volk_32fc_conjugate_32fc_u_sse3(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:102
static void volk_32fc_conjugate_32fc_a_sse3(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:198
static void volk_32fc_conjugate_32fc_a_neon(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:232
static void volk_32fc_conjugate_32fc_u_avx(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:66
static void volk_32fc_conjugate_32fc_generic(lv_32fc_t *cVector, const lv_32fc_t *aVector, unsigned int num_points)
Definition: volk_32fc_conjugate_32fc.h:135
#define __VOLK_PREFETCH(addr)
Definition: volk_common.h:68
#define lv_conj(x)
Definition: volk_complex.h:100
float complex lv_32fc_t
Definition: volk_complex.h:74