1 #ifndef INCLUDED_volk_16i_convert_8i_a_H
2 #define INCLUDED_volk_16i_convert_8i_a_H
15 static inline void volk_16i_convert_8i_a_sse2(int8_t* outputVector,
const int16_t* inputVector,
unsigned int num_points){
16 unsigned int number = 0;
17 const unsigned int sixteenthPoints = num_points / 16;
19 int8_t* outputVectorPtr = outputVector;
20 int16_t* inputPtr = (int16_t*)inputVector;
25 for(;number < sixteenthPoints; number++){
28 inputVal1 = _mm_load_si128((__m128i*)inputPtr); inputPtr += 8;
29 inputVal2 = _mm_load_si128((__m128i*)inputPtr); inputPtr += 8;
31 inputVal1 = _mm_srai_epi16(inputVal1, 8);
32 inputVal2 = _mm_srai_epi16(inputVal2, 8);
34 ret = _mm_packs_epi16(inputVal1, inputVal2);
36 _mm_store_si128((__m128i*)outputVectorPtr, ret);
38 outputVectorPtr += 16;
41 number = sixteenthPoints * 16;
42 for(; number < num_points; number++){
43 outputVector[number] =(int8_t)(inputVector[number] >> 8);
48 #ifdef LV_HAVE_GENERIC
55 static inline void volk_16i_convert_8i_a_generic(int8_t* outputVector,
const int16_t* inputVector,
unsigned int num_points){
56 int8_t* outputVectorPtr = outputVector;
57 const int16_t* inputVectorPtr = inputVector;
58 unsigned int number = 0;
60 for(number = 0; number < num_points; number++){
61 *outputVectorPtr++ = ((int8_t)(*inputVectorPtr++ >> 8));