23 #ifndef INCLUDED_volk_16ic_s32f_deinterleave_32f_x2_a_H
24 #define INCLUDED_volk_16ic_s32f_deinterleave_32f_x2_a_H
31 #include <xmmintrin.h>
40 static inline void volk_16ic_s32f_deinterleave_32f_x2_a_sse(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points){
41 float* iBufferPtr = iBuffer;
42 float* qBufferPtr = qBuffer;
45 const uint64_t quarterPoints = num_points / 4;
46 __m128 cplxValue1, cplxValue2, iValue, qValue;
48 __m128 invScalar = _mm_set_ps1(1.0/scalar);
53 for(;number < quarterPoints; number++){
55 floatBuffer[0] = (float)(complexVectorPtr[0]);
56 floatBuffer[1] = (float)(complexVectorPtr[1]);
57 floatBuffer[2] = (float)(complexVectorPtr[2]);
58 floatBuffer[3] = (float)(complexVectorPtr[3]);
60 floatBuffer[4] = (float)(complexVectorPtr[4]);
61 floatBuffer[5] = (float)(complexVectorPtr[5]);
62 floatBuffer[6] = (float)(complexVectorPtr[6]);
63 floatBuffer[7] = (float)(complexVectorPtr[7]);
65 cplxValue1 = _mm_load_ps(&floatBuffer[0]);
66 cplxValue2 = _mm_load_ps(&floatBuffer[4]);
68 complexVectorPtr += 8;
70 cplxValue1 = _mm_mul_ps(cplxValue1, invScalar);
71 cplxValue2 = _mm_mul_ps(cplxValue2, invScalar);
74 iValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(2,0,2,0));
76 qValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(3,1,3,1));
78 _mm_store_ps(iBufferPtr, iValue);
79 _mm_store_ps(qBufferPtr, qValue);
85 number = quarterPoints * 4;
86 complexVectorPtr = (
int16_t*)&complexVector[number];
87 for(; number < num_points; number++){
88 *iBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
89 *qBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
94 #ifdef LV_HAVE_GENERIC
103 static inline void volk_16ic_s32f_deinterleave_32f_x2_generic(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points){
105 float* iBufferPtr = iBuffer;
106 float* qBufferPtr = qBuffer;
108 for(number = 0; number < num_points; number++){
109 *iBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
110 *qBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
124 extern void volk_16ic_s32f_deinterleave_32f_x2_a_orc_impl(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points);
125 static inline void volk_16ic_s32f_deinterleave_32f_x2_u_orc(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points){
126 volk_16ic_s32f_deinterleave_32f_x2_a_orc_impl(iBuffer, qBuffer, complexVector, scalar, num_points);
short complex lv_16sc_t
Definition: volk_complex.h:53
signed short int16_t
Definition: stdint.h:76
unsigned __int64 uint64_t
Definition: stdint.h:90
#define __VOLK_ATTR_ALIGNED(x)
Definition: volk_common.h:27