GNU Radio 3.5.3.2 C++ API
|
00001 #ifndef INCLUDED_volk_32f_sqrt_32f_a_H 00002 #define INCLUDED_volk_32f_sqrt_32f_a_H 00003 00004 #include <inttypes.h> 00005 #include <stdio.h> 00006 #include <math.h> 00007 00008 #ifdef LV_HAVE_SSE 00009 #include <xmmintrin.h> 00010 /*! 00011 \brief Sqrts the two input vectors and store their results in the third vector 00012 \param cVector The vector where the results will be stored 00013 \param aVector One of the vectors to be sqrted 00014 \param num_points The number of values in aVector and bVector to be sqrted together and stored into cVector 00015 */ 00016 static inline void volk_32f_sqrt_32f_a_sse(float* cVector, const float* aVector, unsigned int num_points){ 00017 unsigned int number = 0; 00018 const unsigned int quarterPoints = num_points / 4; 00019 00020 float* cPtr = cVector; 00021 const float* aPtr = aVector; 00022 00023 __m128 aVal, cVal; 00024 for(;number < quarterPoints; number++){ 00025 00026 aVal = _mm_load_ps(aPtr); 00027 00028 cVal = _mm_sqrt_ps(aVal); 00029 00030 _mm_store_ps(cPtr,cVal); // Store the results back into the C container 00031 00032 aPtr += 4; 00033 cPtr += 4; 00034 } 00035 00036 number = quarterPoints * 4; 00037 for(;number < num_points; number++){ 00038 *cPtr++ = sqrtf(*aPtr++); 00039 } 00040 } 00041 #endif /* LV_HAVE_SSE */ 00042 00043 #ifdef LV_HAVE_GENERIC 00044 /*! 00045 \brief Sqrts the two input vectors and store their results in the third vector 00046 \param cVector The vector where the results will be stored 00047 \param aVector One of the vectors to be sqrted 00048 \param num_points The number of values in aVector and bVector to be sqrted together and stored into cVector 00049 */ 00050 static inline void volk_32f_sqrt_32f_a_generic(float* cVector, const float* aVector, unsigned int num_points){ 00051 float* cPtr = cVector; 00052 const float* aPtr = aVector; 00053 unsigned int number = 0; 00054 00055 for(number = 0; number < num_points; number++){ 00056 *cPtr++ = sqrtf(*aPtr++); 00057 } 00058 } 00059 #endif /* LV_HAVE_GENERIC */ 00060 00061 #ifdef LV_HAVE_ORC 00062 extern void volk_32f_sqrt_32f_a_orc_impl(float *, const float*, unsigned int); 00063 /*! 00064 \brief Sqrts the two input vectors and store their results in the third vector 00065 \param cVector The vector where the results will be stored 00066 \param aVector One of the vectors to be sqrted 00067 \param num_points The number of values in aVector and bVector to be sqrted together and stored into cVector 00068 */ 00069 static inline void volk_32f_sqrt_32f_a_orc(float* cVector, const float* aVector, unsigned int num_points){ 00070 volk_32f_sqrt_32f_a_orc_impl(cVector, aVector, num_points); 00071 } 00072 00073 #endif /* LV_HAVE_ORC */ 00074 00075 00076 00077 #endif /* INCLUDED_volk_32f_sqrt_32f_a_H */