/external/XNNPACK/src/qu8-requantization/ |
D | q31-scalar.c | 72 const int32_t w_q31product = (int32_t)(uint32_t)((uint64_t)(w_product + q31rounding) >> 31); in xnn_qu8_requantize_q31__scalar() local 101 const int32_t w_remainder = (w_q31product & remainder_mask) - (int32_t)(w_q31product < 0); in xnn_qu8_requantize_q31__scalar() 106 const int32_t w_scaled = asr_s32(w_q31product, shift) + (int32_t)(w_remainder > threshold); in xnn_qu8_requantize_q31__scalar()
|
D | q31-sse4.c | 89 const __m128i w_q31product = _mm_blend_epi16(w_q31product_even, w_q31product_odd, 0xCC); in xnn_qu8_requantize_q31__sse4() local 98 …_mm_add_epi32(_mm_and_si128(w_q31product, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), w… in xnn_qu8_requantize_q31__sse4() 107 … _mm_sub_epi32(_mm_sra_epi32(w_q31product, vshift), _mm_cmpgt_epi32(w_remainder, vthreshold)); in xnn_qu8_requantize_q31__sse4()
|
D | q31-wasmsimd.c | 92 const v128_t w_q31product = wasm_v32x4_shuffle(w_product_lo, w_product_hi, 1, 3, 5, 7); in xnn_qu8_requantize_q31__wasmsimd() local 101 … wasm_i32x4_add(wasm_v128_and(w_q31product, vremainder_mask), wasm_i32x4_lt(w_q31product, vzero)); in xnn_qu8_requantize_q31__wasmsimd() 110 wasm_i32x4_sub(wasm_i32x4_shr(w_q31product, shift), wasm_i32x4_gt(w_remainder, vthreshold)); in xnn_qu8_requantize_q31__wasmsimd()
|
D | q31-ssse3.c | 138 const __m128i w_q31product = _mm_shuffle_epi32(w_q31product_0213, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qu8_requantize_q31__ssse3() local 147 …_mm_add_epi32(_mm_and_si128(w_q31product, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), w… in xnn_qu8_requantize_q31__ssse3() 156 … _mm_sub_epi32(_mm_sra_epi32(w_q31product, vshift), _mm_cmpgt_epi32(w_remainder, vthreshold)); in xnn_qu8_requantize_q31__ssse3()
|
D | q31-sse2.c | 138 const __m128i w_q31product = _mm_shuffle_epi32(w_q31product_0213, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qu8_requantize_q31__sse2() local 147 …_mm_add_epi32(_mm_and_si128(w_q31product, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), w… in xnn_qu8_requantize_q31__sse2() 156 … _mm_sub_epi32(_mm_sra_epi32(w_q31product, vshift), _mm_cmpgt_epi32(w_remainder, vthreshold)); in xnn_qu8_requantize_q31__sse2()
|
/external/XNNPACK/src/qs8-requantization/ |
D | q31-scalar.c | 72 const int32_t w_q31product = (int32_t) (uint32_t) ((uint64_t) (w_product + q31rounding) >> 31); in xnn_qs8_requantize_q31__scalar() local 101 const int32_t w_remainder = (w_q31product & remainder_mask) - (int32_t) (w_q31product < 0); in xnn_qs8_requantize_q31__scalar() 106 const int32_t w_scaled = asr_s32(w_q31product, shift) + (int32_t) (w_remainder > threshold); in xnn_qs8_requantize_q31__scalar()
|
D | q31-sse4.c | 89 const __m128i w_q31product = _mm_blend_epi16(w_q31product_even, w_q31product_odd, 0xCC); in xnn_qs8_requantize_q31__sse4() local 98 …_mm_add_epi32(_mm_and_si128(w_q31product, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), w… in xnn_qs8_requantize_q31__sse4() 107 … _mm_sub_epi32(_mm_sra_epi32(w_q31product, vshift), _mm_cmpgt_epi32(w_remainder, vthreshold)); in xnn_qs8_requantize_q31__sse4()
|
D | q31-wasmsimd.c | 92 const v128_t w_q31product = wasm_v32x4_shuffle(w_product_lo, w_product_hi, 1, 3, 5, 7); in xnn_qs8_requantize_q31__wasmsimd() local 101 … wasm_i32x4_add(wasm_v128_and(w_q31product, vremainder_mask), wasm_i32x4_lt(w_q31product, vzero)); in xnn_qs8_requantize_q31__wasmsimd() 110 wasm_i32x4_sub(wasm_i32x4_shr(w_q31product, shift), wasm_i32x4_gt(w_remainder, vthreshold)); in xnn_qs8_requantize_q31__wasmsimd()
|
D | q31-ssse3.c | 138 const __m128i w_q31product = _mm_shuffle_epi32(w_q31product_0213, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qs8_requantize_q31__ssse3() local 147 …_mm_add_epi32(_mm_and_si128(w_q31product, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), w… in xnn_qs8_requantize_q31__ssse3() 156 … _mm_sub_epi32(_mm_sra_epi32(w_q31product, vshift), _mm_cmpgt_epi32(w_remainder, vthreshold)); in xnn_qs8_requantize_q31__ssse3()
|
D | q31-sse2.c | 138 const __m128i w_q31product = _mm_shuffle_epi32(w_q31product_0213, _MM_SHUFFLE(3, 1, 2, 0)); in xnn_qs8_requantize_q31__sse2() local 147 …_mm_add_epi32(_mm_and_si128(w_q31product, vremainder_mask), _mm_cmpgt_epi32(_mm_setzero_si128(), w… in xnn_qs8_requantize_q31__sse2() 156 … _mm_sub_epi32(_mm_sra_epi32(w_q31product, vshift), _mm_cmpgt_epi32(w_remainder, vthreshold)); in xnn_qs8_requantize_q31__sse2()
|