40#ifndef INCLUDED_volk_16i_max_star_16i_a_H
41#define INCLUDED_volk_16i_max_star_16i_a_H
55 const unsigned int num_bytes = num_points * 2;
57 short candidate = src0[0];
59 __m128i xmm0, xmm1, xmm3, xmm4, xmm5, xmm6;
65 int bound = num_bytes >> 4;
66 int leftovers = (num_bytes >> 1) & 7;
76 for (
i = 0;
i < bound; ++
i) {
95 for (
i = 0;
i < 8; ++
i) {
96 candidate = ((short)(candidate - cands[
i]) > 0) ? candidate : cands[
i];
99 for (
i = 0;
i < leftovers; ++
i) {
100 candidate = ((short)(candidate - src0[(bound << 3) +
i]) > 0)
102 : src0[(bound << 3) +
i];
105 target[0] = candidate;
110#ifdef LV_HAVE_GENERIC
115 const unsigned int num_bytes = num_points * 2;
119 int bound = num_bytes >> 1;
121 short candidate = src0[0];
122 for (
i = 1;
i < bound; ++
i) {
123 candidate = ((short)(candidate - src0[
i]) > 0) ? candidate : src0[
i];
125 target[0] = candidate;
FORCE_INLINE void _mm_store_si128(__m128i *p, __m128i a)
Definition: sse2neon.h:5937
FORCE_INLINE __m128i _mm_cmpeq_epi16(__m128i a, __m128i b)
Definition: sse2neon.h:3267
FORCE_INLINE __m128i _mm_setzero_si128()
Definition: sse2neon.h:5339
FORCE_INLINE __m128i _mm_and_si128(__m128i, __m128i)
Definition: sse2neon.h:3128
FORCE_INLINE __m128i _mm_add_epi16(__m128i a, __m128i b)
Definition: sse2neon.h:2969
FORCE_INLINE __m128i _mm_shuffle_epi8(__m128i a, __m128i b)
Definition: sse2neon.h:7069
FORCE_INLINE __m128i _mm_xor_si128(__m128i a, __m128i b)
Definition: sse2neon.h:6458
FORCE_INLINE __m128i _mm_load_si128(const __m128i *p)
Definition: sse2neon.h:4471
FORCE_INLINE __m128i _mm_cmpgt_epi16(__m128i a, __m128i b)
Definition: sse2neon.h:3367
int64x2_t __m128i
Definition: sse2neon.h:244
static void volk_16i_max_star_16i_a_ssse3(short *target, short *src0, unsigned int num_points)
Definition: volk_16i_max_star_16i.h:53
static void volk_16i_max_star_16i_generic(short *target, short *src0, unsigned int num_points)
Definition: volk_16i_max_star_16i.h:113
for i
Definition: volk_config_fixed.tmpl.h:13