1 #ifndef INCLUDED_volk_16ic_s32f_deinterleave_32f_x2_a_H
2 #define INCLUDED_volk_16ic_s32f_deinterleave_32f_x2_a_H
18 static inline void volk_16ic_s32f_deinterleave_32f_x2_a_sse(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points){
19 float* iBufferPtr = iBuffer;
20 float* qBufferPtr = qBuffer;
23 const uint64_t quarterPoints = num_points / 4;
24 __m128 cplxValue1, cplxValue2, iValue, qValue;
26 __m128 invScalar = _mm_set_ps1(1.0/scalar);
31 for(;number < quarterPoints; number++){
33 floatBuffer[0] = (float)(complexVectorPtr[0]);
34 floatBuffer[1] = (float)(complexVectorPtr[1]);
35 floatBuffer[2] = (float)(complexVectorPtr[2]);
36 floatBuffer[3] = (float)(complexVectorPtr[3]);
38 floatBuffer[4] = (float)(complexVectorPtr[4]);
39 floatBuffer[5] = (float)(complexVectorPtr[5]);
40 floatBuffer[6] = (float)(complexVectorPtr[6]);
41 floatBuffer[7] = (float)(complexVectorPtr[7]);
43 cplxValue1 = _mm_load_ps(&floatBuffer[0]);
44 cplxValue2 = _mm_load_ps(&floatBuffer[4]);
46 complexVectorPtr += 8;
48 cplxValue1 = _mm_mul_ps(cplxValue1, invScalar);
49 cplxValue2 = _mm_mul_ps(cplxValue2, invScalar);
52 iValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(2,0,2,0));
54 qValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(3,1,3,1));
56 _mm_store_ps(iBufferPtr, iValue);
57 _mm_store_ps(qBufferPtr, qValue);
63 number = quarterPoints * 4;
64 complexVectorPtr = (
int16_t*)&complexVector[number];
65 for(; number < num_points; number++){
66 *iBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
67 *qBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
72 #ifdef LV_HAVE_GENERIC
81 static inline void volk_16ic_s32f_deinterleave_32f_x2_generic(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points){
83 float* iBufferPtr = iBuffer;
84 float* qBufferPtr = qBuffer;
86 for(number = 0; number < num_points; number++){
87 *iBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
88 *qBufferPtr++ = (float)(*complexVectorPtr++) / scalar;
102 extern void volk_16ic_s32f_deinterleave_32f_x2_a_orc_impl(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points);
103 static inline void volk_16ic_s32f_deinterleave_32f_x2_u_orc(
float* iBuffer,
float* qBuffer,
const lv_16sc_t* complexVector,
const float scalar,
unsigned int num_points){
104 volk_16ic_s32f_deinterleave_32f_x2_a_orc_impl(iBuffer, qBuffer, complexVector, scalar, num_points);
short complex lv_16sc_t
Definition: volk_complex.h:53
signed short int16_t
Definition: stdint.h:76
unsigned __int64 uint64_t
Definition: stdint.h:90
#define __VOLK_ATTR_ALIGNED(x)
Definition: volk_common.h:27