1 #ifndef INCLUDED_volk_8i_convert_16i_u_H
2 #define INCLUDED_volk_8i_convert_16i_u_H
/*
 * Convert num_points signed 8-bit samples from inputVector into signed 16-bit
 * samples in outputVector, scaling each sample by 256, using SSE4.1
 * intrinsics.
 *
 * outputVector: destination buffer; written through unaligned 128-bit stores
 *               in the vector loop and by index in the scalar tail.
 * inputVector:  source buffer; read through unaligned 128-bit loads in the
 *               vector loop and by index in the scalar tail.
 * num_points:   number of samples to convert.
 *
 * NOTE(review): in this view the declarations of inputVal and ret, any
 * advance of inputVectorPtr / outputVectorPtr inside the vector loop, and the
 * closing braces are not visible -- presumably they sit on lines elided from
 * this excerpt; confirm against the complete file.
 */
17 static inline void volk_8i_convert_16i_u_sse4_1(
int16_t* outputVector,
const int8_t* inputVector,
unsigned int num_points){
18 unsigned int number = 0;
/* Number of complete 16-sample groups; one 128-bit load covers 16 int8 values. */
19 const unsigned int sixteenthPoints = num_points / 16;
/* View both buffers as 128-bit vectors for the unaligned load/store intrinsics. */
21 const __m128i* inputVectorPtr = (
const __m128i*)inputVector;
22 __m128i* outputVectorPtr = (__m128i*)outputVector;
/* Vector loop: one iteration per group of 16 input samples. */
26 for(;number < sixteenthPoints; number++){
/* Unaligned load of 16 input bytes. */
27 inputVal = _mm_loadu_si128(inputVectorPtr);
/* Sign-extend the low 8 bytes into eight 16-bit lanes. */
28 ret = _mm_cvtepi8_epi16(inputVal);
/* Shift each lane left by 8 bits, i.e. multiply by 256 like the scalar tail below. */
29 ret = _mm_slli_epi16(ret, 8);
30 _mm_storeu_si128(outputVectorPtr, ret);
/* Byte-shift the register right by 8 so the upper 8 samples land in the low half. */
34 inputVal = _mm_srli_si128(inputVal, 8);
/* Same widen-and-scale sequence for the second half of the group. */
35 ret = _mm_cvtepi8_epi16(inputVal);
36 ret = _mm_slli_epi16(ret, 8);
37 _mm_storeu_si128(outputVectorPtr, ret);
/* Scalar tail: resume at the first sample not covered by a full group of 16. */
44 number = sixteenthPoints * 16;
45 for(; number < num_points; number++){
/* int8 range times 256 spans -32768..32512, which fits in int16_t. */
46 outputVector[number] = (
int16_t)(inputVector[number])*256;
51 #ifdef LV_HAVE_GENERIC
59 static inline void volk_8i_convert_16i_u_generic(
int16_t* outputVector,
const int8_t* inputVector,
unsigned int num_points){
60 int16_t* outputVectorPtr = outputVector;
61 const int8_t* inputVectorPtr = inputVector;
62 unsigned int number = 0;
64 for(number = 0; number < num_points; number++){
65 *outputVectorPtr++ = ((
int16_t)(*inputVectorPtr++)) * 256;