GNU Radio 3.5.3.2 C++ API
volk_32f_s32f_convert_32i_a.h
Go to the documentation of this file.
00001 #ifndef INCLUDED_volk_32f_s32f_convert_32i_a_H
00002 #define INCLUDED_volk_32f_s32f_convert_32i_a_H
00003 
00004 #include <volk/volk_common.h>
00005 #include <inttypes.h>
00006 #include <stdio.h>
00007 
00008 #ifdef LV_HAVE_AVX
00009 #include <immintrin.h>
00010   /*!
00011     \brief Multiplies each point in the input buffer by the scalar value, then converts the result into a 32 bit integer value
00012     \param inputVector The floating point input data buffer
00013     \param outputVector The 32 bit output data buffer
00014     \param scalar The value multiplied against each point in the input buffer
00015     \param num_points The number of data values to be converted
00016   */
00017 static inline void volk_32f_s32f_convert_32i_a_avx(int32_t* outputVector, const float* inputVector, const float scalar, unsigned int num_points){
00018   unsigned int number = 0;
00019 
00020   const unsigned int eighthPoints = num_points / 8;
00021     
00022   const float* inputVectorPtr = (const float*)inputVector;
00023   int32_t* outputVectorPtr = outputVector;
00024 
00025   float min_val = -2147483647;
00026   float max_val = 2147483647;
00027   float r;
00028 
00029   __m256 vScalar = _mm256_set1_ps(scalar);
00030   __m256 inputVal1;
00031   __m256i intInputVal1;
00032   __m256 vmin_val = _mm256_set1_ps(min_val);
00033   __m256 vmax_val = _mm256_set1_ps(max_val);
00034 
00035   for(;number < eighthPoints; number++){
00036     inputVal1 = _mm256_load_ps(inputVectorPtr); inputVectorPtr += 8;
00037 
00038     inputVal1 = _mm256_max_ps(_mm256_min_ps(_mm256_mul_ps(inputVal1, vScalar), vmax_val), vmin_val);
00039     intInputVal1 = _mm256_cvtps_epi32(inputVal1);
00040 
00041     _mm256_store_si256((__m256i*)outputVectorPtr, intInputVal1);
00042     outputVectorPtr += 8;
00043   }
00044 
00045   number = eighthPoints * 8;    
00046   for(; number < num_points; number++){
00047     r = inputVector[number] * scalar;
00048     if(r > max_val)
00049       r = max_val;
00050     else if(r < min_val)
00051       r = min_val;
00052     outputVector[number] = (int32_t)(r);
00053   }
00054 }
00055 #endif /* LV_HAVE_AVX */
00056 
00057 #ifdef LV_HAVE_SSE2
00058 #include <emmintrin.h>
00059   /*!
00060     \brief Multiplies each point in the input buffer by the scalar value, then converts the result into a 32 bit integer value
00061     \param inputVector The floating point input data buffer
00062     \param outputVector The 32 bit output data buffer
00063     \param scalar The value multiplied against each point in the input buffer
00064     \param num_points The number of data values to be converted
00065   */
00066 static inline void volk_32f_s32f_convert_32i_a_sse2(int32_t* outputVector, const float* inputVector, const float scalar, unsigned int num_points){
00067   unsigned int number = 0;
00068 
00069   const unsigned int quarterPoints = num_points / 4;
00070     
00071   const float* inputVectorPtr = (const float*)inputVector;
00072   int32_t* outputVectorPtr = outputVector;
00073 
00074   float min_val = -2147483647;
00075   float max_val = 2147483647;
00076   float r;
00077 
00078   __m128 vScalar = _mm_set_ps1(scalar);
00079   __m128 inputVal1;
00080   __m128i intInputVal1;
00081   __m128 vmin_val = _mm_set_ps1(min_val);
00082   __m128 vmax_val = _mm_set_ps1(max_val);
00083 
00084   for(;number < quarterPoints; number++){
00085     inputVal1 = _mm_load_ps(inputVectorPtr); inputVectorPtr += 4;
00086 
00087     inputVal1 = _mm_max_ps(_mm_min_ps(_mm_mul_ps(inputVal1, vScalar), vmax_val), vmin_val);
00088     intInputVal1 = _mm_cvtps_epi32(inputVal1);
00089 
00090     _mm_store_si128((__m128i*)outputVectorPtr, intInputVal1);
00091     outputVectorPtr += 4;
00092   }
00093 
00094   number = quarterPoints * 4;    
00095   for(; number < num_points; number++){
00096     r = inputVector[number] * scalar;
00097     if(r > max_val)
00098       r = max_val;
00099     else if(r < min_val)
00100       r = min_val;
00101     outputVector[number] = (int32_t)(r);
00102   }
00103 }
00104 #endif /* LV_HAVE_SSE2 */
00105 
00106 #ifdef LV_HAVE_SSE
00107 #include <xmmintrin.h>
00108   /*!
00109     \brief Multiplies each point in the input buffer by the scalar value, then converts the result into a 32 bit integer value
00110     \param inputVector The floating point input data buffer
00111     \param outputVector The 32 bit output data buffer
00112     \param scalar The value multiplied against each point in the input buffer
00113     \param num_points The number of data values to be converted
00114   */
00115 static inline void volk_32f_s32f_convert_32i_a_sse(int32_t* outputVector, const float* inputVector, const float scalar, unsigned int num_points){
00116   unsigned int number = 0;
00117 
00118   const unsigned int quarterPoints = num_points / 4;
00119     
00120   const float* inputVectorPtr = (const float*)inputVector;
00121   int32_t* outputVectorPtr = outputVector;
00122 
00123   float min_val = -2147483647;
00124   float max_val = 2147483647;
00125   float r;
00126 
00127   __m128 vScalar = _mm_set_ps1(scalar);
00128   __m128 ret;
00129   __m128 vmin_val = _mm_set_ps1(min_val);
00130   __m128 vmax_val = _mm_set_ps1(max_val);
00131 
00132   __VOLK_ATTR_ALIGNED(16) float outputFloatBuffer[4];
00133 
00134   for(;number < quarterPoints; number++){
00135     ret = _mm_load_ps(inputVectorPtr);
00136     inputVectorPtr += 4;
00137 
00138     ret = _mm_max_ps(_mm_min_ps(_mm_mul_ps(ret, vScalar), vmax_val), vmin_val);
00139 
00140     _mm_store_ps(outputFloatBuffer, ret);
00141     *outputVectorPtr++ = (int32_t)(outputFloatBuffer[0]);
00142     *outputVectorPtr++ = (int32_t)(outputFloatBuffer[1]);
00143     *outputVectorPtr++ = (int32_t)(outputFloatBuffer[2]);
00144     *outputVectorPtr++ = (int32_t)(outputFloatBuffer[3]);
00145   }
00146 
00147   number = quarterPoints * 4;    
00148   for(; number < num_points; number++){
00149     r = inputVector[number] * scalar;
00150     if(r > max_val)
00151       r = max_val;
00152     else if(r < min_val)
00153       r = min_val;
00154     outputVector[number] = (int32_t)(r);
00155   }
00156 }
00157 #endif /* LV_HAVE_SSE */
00158 
00159 #ifdef LV_HAVE_GENERIC
00160   /*!
00161     \brief Multiplies each point in the input buffer by the scalar value, then converts the result into a 32 bit integer value
00162     \param inputVector The floating point input data buffer
00163     \param outputVector The 32 bit output data buffer
00164     \param scalar The value multiplied against each point in the input buffer
00165     \param num_points The number of data values to be converted
00166   */
00167 static inline void volk_32f_s32f_convert_32i_a_generic(int32_t* outputVector, const float* inputVector, const float scalar, unsigned int num_points){
00168   int32_t* outputVectorPtr = outputVector;
00169   const float* inputVectorPtr = inputVector;
00170   unsigned int number = 0;
00171   float min_val = -2147483647;
00172   float max_val = 2147483647;
00173   float r;
00174 
00175   for(number = 0; number < num_points; number++){
00176     r = *inputVectorPtr++ * scalar;
00177     if(r > max_val)
00178       r = max_val;
00179     else if(r < min_val)
00180       r = min_val;
00181     *outputVectorPtr++ = (int32_t)(r);
00182   }
00183 }
00184 #endif /* LV_HAVE_GENERIC */
00185 
00186 
00187 
00188 
00189 #endif /* INCLUDED_volk_32f_s32f_convert_32i_a_H */