53 #ifndef INCLUDED_volk_16ic_deinterleave_real_16i_a_H
54 #define INCLUDED_volk_16ic_deinterleave_real_16i_a_H
60 #include <tmmintrin.h>
63 volk_16ic_deinterleave_real_16i_a_ssse3(
int16_t* iBuffer,
const lv_16sc_t* complexVector,
unsigned int num_points)
65 unsigned int number = 0;
69 __m128i iMoveMask1 = _mm_set_epi8(0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 13, 12, 9, 8, 5, 4, 1, 0);
70 __m128i iMoveMask2 = _mm_set_epi8(13, 12, 9, 8, 5, 4, 1, 0, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80, 0x80);
72 __m128i complexVal1, complexVal2, iOutputVal;
74 unsigned int eighthPoints = num_points / 8;
76 for(number = 0; number < eighthPoints; number++){
77 complexVal1 = _mm_load_si128((__m128i*)complexVectorPtr); complexVectorPtr += 8;
78 complexVal2 = _mm_load_si128((__m128i*)complexVectorPtr); complexVectorPtr += 8;
80 complexVal1 = _mm_shuffle_epi8(complexVal1, iMoveMask1);
81 complexVal2 = _mm_shuffle_epi8(complexVal2, iMoveMask2);
83 iOutputVal = _mm_or_si128(complexVal1, complexVal2);
85 _mm_store_si128((__m128i*)iBufferPtr, iOutputVal);
90 number = eighthPoints * 8;
91 for(; number < num_points; number++){
92 *iBufferPtr++ = *complexVectorPtr++;
100 #include <emmintrin.h>
103 volk_16ic_deinterleave_real_16i_a_sse2(
int16_t* iBuffer,
const lv_16sc_t* complexVector,
unsigned int num_points)
105 unsigned int number = 0;
108 __m128i complexVal1, complexVal2, iOutputVal;
109 __m128i lowMask = _mm_set_epi32(0x0, 0x0, 0xFFFFFFFF, 0xFFFFFFFF);
110 __m128i highMask = _mm_set_epi32(0xFFFFFFFF, 0xFFFFFFFF, 0x0, 0x0);
112 unsigned int eighthPoints = num_points / 8;
114 for(number = 0; number < eighthPoints; number++){
115 complexVal1 = _mm_load_si128((__m128i*)complexVectorPtr); complexVectorPtr += 8;
116 complexVal2 = _mm_load_si128((__m128i*)complexVectorPtr); complexVectorPtr += 8;
118 complexVal1 = _mm_shufflelo_epi16(complexVal1, _MM_SHUFFLE(3,1,2,0));
120 complexVal1 = _mm_shufflehi_epi16(complexVal1, _MM_SHUFFLE(3,1,2,0));
122 complexVal1 = _mm_shuffle_epi32(complexVal1, _MM_SHUFFLE(3,1,2,0));
124 complexVal2 = _mm_shufflelo_epi16(complexVal2, _MM_SHUFFLE(3,1,2,0));
126 complexVal2 = _mm_shufflehi_epi16(complexVal2, _MM_SHUFFLE(3,1,2,0));
128 complexVal2 = _mm_shuffle_epi32(complexVal2, _MM_SHUFFLE(2,0,3,1));
130 iOutputVal = _mm_or_si128(_mm_and_si128(complexVal1, lowMask), _mm_and_si128(complexVal2, highMask));
132 _mm_store_si128((__m128i*)iBufferPtr, iOutputVal);
137 number = eighthPoints * 8;
138 for(; number < num_points; number++){
139 *iBufferPtr++ = *complexVectorPtr++;
145 #ifdef LV_HAVE_GENERIC
148 volk_16ic_deinterleave_real_16i_generic(
int16_t* iBuffer,
const lv_16sc_t* complexVector,
unsigned int num_points)
150 unsigned int number = 0;
153 for(number = 0; number < num_points; number++){
154 *iBufferPtr++ = *complexVectorPtr++;
short complex lv_16sc_t
Definition: volk_complex.h:53
signed short int16_t
Definition: stdint.h:76