doc/doxygen-3.7.2/volk__32fc__s32f__magnitude__16i_8h_source.html

 #ifndef INCLUDED_volk_32fc_s32f_magnitude_16i_a_H

 #define INCLUDED_volk_32fc_s32f_magnitude_16i_a_H


 #include <volk/volk_common.h>

 #include <inttypes.h>

 #include <stdio.h>

 #include <math.h>


 #ifdef LV_HAVE_SSE3

 #include <pmmintrin.h>

 /*!

   \brief Calculates the magnitude of the complexVector, scales the resulting value and stores the results in the magnitudeVector

   \param complexVector The vector containing the complex input values

   \param scalar The scale value multiplied to the magnitude of each complex vector

   \param magnitudeVector The vector containing the real output values

   \param num_points The number of complex values in complexVector to be calculated and stored into cVector

 */

 static inline void volk_32fc_s32f_magnitude_16i_a_sse3(int16_t* magnitudeVector, const lv_32fc_t* complexVector, const float scalar, unsigned int num_points){

   unsigned int number = 0;

   const unsigned int quarterPoints = num_points / 4;


   const float* complexVectorPtr = (const float*)complexVector;

   int16_t* magnitudeVectorPtr = magnitudeVector;


   __m128 vScalar = _mm_set_ps1(scalar);


   __m128 cplxValue1, cplxValue2, result;


   __VOLK_ATTR_ALIGNED(16) float floatBuffer[4];


   for(;number < quarterPoints; number++){

     cplxValue1 = _mm_load_ps(complexVectorPtr);

     complexVectorPtr += 4;


     cplxValue2 = _mm_load_ps(complexVectorPtr);

     complexVectorPtr += 4;


     cplxValue1 = _mm_mul_ps(cplxValue1, cplxValue1); // Square the values

     cplxValue2 = _mm_mul_ps(cplxValue2, cplxValue2); // Square the Values


     result = _mm_hadd_ps(cplxValue1, cplxValue2); // Add the I2 and Q2 values


     result = _mm_sqrt_ps(result);


     result = _mm_mul_ps(result, vScalar);


     _mm_store_ps(floatBuffer, result);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[0]);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[1]);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[2]);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[3]);

   }


   number = quarterPoints * 4;

   magnitudeVectorPtr = &magnitudeVector[number];

   for(; number < num_points; number++){

     float val1Real = *complexVectorPtr++;

     float val1Imag = *complexVectorPtr++;

     *magnitudeVectorPtr++ = (int16_t)(sqrtf((val1Real * val1Real) + (val1Imag * val1Imag)) * scalar);

   }

 }

 #endif /* LV_HAVE_SSE3 */


 #ifdef LV_HAVE_SSE

 #include <xmmintrin.h>

 /*!

   \brief Calculates the magnitude of the complexVector, scales the resulting value and stores the results in the magnitudeVector

   \param complexVector The vector containing the complex input values

   \param scalar The scale value multiplied to the magnitude of each complex vector

   \param magnitudeVector The vector containing the real output values

   \param num_points The number of complex values in complexVector to be calculated and stored into cVector

 */

 static inline void volk_32fc_s32f_magnitude_16i_a_sse(int16_t* magnitudeVector, const lv_32fc_t* complexVector, const float scalar, unsigned int num_points){

   unsigned int number = 0;

   const unsigned int quarterPoints = num_points / 4;


   const float* complexVectorPtr = (const float*)complexVector;

   int16_t* magnitudeVectorPtr = magnitudeVector;


   __m128 vScalar = _mm_set_ps1(scalar);


   __m128 cplxValue1, cplxValue2, iValue, qValue, result;


   __VOLK_ATTR_ALIGNED(16) float floatBuffer[4];


   for(;number < quarterPoints; number++){

     cplxValue1 = _mm_load_ps(complexVectorPtr);

     complexVectorPtr += 4;


     cplxValue2 = _mm_load_ps(complexVectorPtr);

     complexVectorPtr += 4;


     // Arrange in i1i2i3i4 format

     iValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(2,0,2,0));

     // Arrange in q1q2q3q4 format

     qValue = _mm_shuffle_ps(cplxValue1, cplxValue2, _MM_SHUFFLE(3,1,3,1));


     iValue = _mm_mul_ps(iValue, iValue); // Square the I values

     qValue = _mm_mul_ps(qValue, qValue); // Square the Q Values


     result = _mm_add_ps(iValue, qValue); // Add the I2 and Q2 values


     result = _mm_sqrt_ps(result);


     result = _mm_mul_ps(result, vScalar);


     _mm_store_ps(floatBuffer, result);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[0]);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[1]);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[2]);

     *magnitudeVectorPtr++ = (int16_t)(floatBuffer[3]);

   }


   number = quarterPoints * 4;

   magnitudeVectorPtr = &magnitudeVector[number];

   for(; number < num_points; number++){

     float val1Real = *complexVectorPtr++;

     float val1Imag = *complexVectorPtr++;

     *magnitudeVectorPtr++ = (int16_t)(sqrtf((val1Real * val1Real) + (val1Imag * val1Imag)) * scalar);

   }

 }

 #endif /* LV_HAVE_SSE */


 #ifdef LV_HAVE_GENERIC

 /*!
   \brief Calculates the magnitude of the complexVector, scales the resulting value and stores the results, converted to int16_t, in the magnitudeVector (portable C version)
   \param magnitudeVector The vector receiving the scaled 16-bit integer magnitudes
   \param complexVector The vector containing the complex input values
   \param scalar The scale value multiplied to the magnitude of each complex value
   \param num_points The number of complex values in complexVector to be processed and stored into magnitudeVector

   The float to int16_t conversion is a plain C cast: the fractional part is discarded and no clamping is applied.
 */
 static inline void volk_32fc_s32f_magnitude_16i_generic(int16_t* magnitudeVector, const lv_32fc_t* complexVector, const float scalar, unsigned int num_points){
   /* View the input as interleaved real/imaginary floats, keeping its const qualifier. */
   const float* complexVectorPtr = (const float*)complexVector;
   int16_t* magnitudeVectorPtr = magnitudeVector;
   unsigned int number;

   for(number = 0; number < num_points; number++){
     const float real = *complexVectorPtr++;
     const float imag = *complexVectorPtr++;
     *magnitudeVectorPtr++ = (int16_t)(sqrtf((real*real) + (imag*imag)) * scalar);
   }
 }

 #endif /* LV_HAVE_GENERIC */


 #ifdef LV_HAVE_ORC

 /*!

   \brief Calculates the magnitude of the complexVector, scales the resulting value and stores the results in the magnitudeVector

   \param magnitudeVector The vector containing the real output values

   \param complexVector The vector containing the complex input values

   \param scalar The scale value multiplied to the magnitude of each complex vector

   \param num_points The number of complex values in complexVector to be calculated and stored into magnitudeVector

 */

 /* Prototype only: the implementation is not part of this header. */

 extern void volk_32fc_s32f_magnitude_16i_a_orc_impl(int16_t* magnitudeVector, const lv_32fc_t* complexVector, const float scalar, unsigned int num_points);

 /* Thin wrapper that passes all four arguments unchanged to the _a_orc_impl routine. */
 /* NOTE(review): this wrapper is tagged _u_ while the routine it calls is tagged _a_; */
 /* presumably unaligned vs. aligned -- confirm the impl has no alignment requirement. */

 static inline void volk_32fc_s32f_magnitude_16i_u_orc(int16_t* magnitudeVector, const lv_32fc_t* complexVector, const float scalar, unsigned int num_points){

     volk_32fc_s32f_magnitude_16i_a_orc_impl(magnitudeVector, complexVector, scalar, num_points);

 }

 #endif /* LV_HAVE_ORC */


 #endif /* INCLUDED_volk_32fc_s32f_magnitude_16i_a_H */

math.h

int16_t
signed short int16_t
Definition: stdint.h:76

__VOLK_ATTR_ALIGNED
#define __VOLK_ATTR_ALIGNED(x)
Definition: volk_common.h:27

inttypes.h

lv_32fc_t
float complex lv_32fc_t
Definition: volk_complex.h:56

volk_common.h