Home
last modified time | relevance | path

Searched refs:vqmax (Results 1 – 23 of 23) sorted by relevance

/external/XNNPACK/src/qs8-requantization/
Dfp32-sse2.c34 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qs8_requantize_fp32__sse2() local
76 const __m128i xy_clamped = _mm_max_epi16(_mm_min_epi16(xy_packed, vqmax), vqmin); in xnn_qs8_requantize_fp32__sse2()
77 const __m128i zw_clamped = _mm_max_epi16(_mm_min_epi16(zw_packed, vqmax), vqmin); in xnn_qs8_requantize_fp32__sse2()
Dprecise-ssse3.c43 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qs8_requantize_precise__ssse3() local
103 const __m128i xy_clamped = _mm_max_epi16(_mm_min_epi16(xy_packed, vqmax), vqmin); in xnn_qs8_requantize_precise__ssse3()
104 const __m128i zw_clamped = _mm_max_epi16(_mm_min_epi16(zw_packed, vqmax), vqmin); in xnn_qs8_requantize_precise__ssse3()
Dfp32-sse4.c34 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qs8_requantize_fp32__sse4() local
77 const __m128i xyzw_clamped = _mm_max_epi8(_mm_min_epi8(xyzw_packed, vqmax), vqmin); in xnn_qs8_requantize_fp32__sse4()
Dprecise-sse2.c43 const __m128i vqmax = _mm_set1_epi16((short) qmax); in xnn_qs8_requantize_precise__sse2() local
108 const __m128i xy_clamped = _mm_max_epi16(_mm_min_epi16(xy_packed, vqmax), vqmin); in xnn_qs8_requantize_precise__sse2()
109 const __m128i zw_clamped = _mm_max_epi16(_mm_min_epi16(zw_packed, vqmax), vqmin); in xnn_qs8_requantize_precise__sse2()
Dq31-neon.c51 const int8x16_t vqmax = vdupq_n_s8(qmax); in xnn_qs8_requantize_q31__neon() local
92 const int8x16_t xyzw_clamped = vmaxq_s8(vminq_s8(xyzw_packed, vqmax), vqmin); in xnn_qs8_requantize_q31__neon()
Dfp32-neon.c35 const int8x16_t vqmax = vdupq_n_s8(qmax); in xnn_qs8_requantize_fp32__neon() local
77 const int8x16_t xyzw_clamped = vmaxq_s8(vminq_s8(xyzw_packed, vqmax), vqmin); in xnn_qs8_requantize_fp32__neon()
Dq31-ssse3.c49 const __m128i vqmax = _mm_set1_epi16((short) qmax); in xnn_qs8_requantize_q31__ssse3() local
160 const __m128i xy_clamped = _mm_max_epi16(_mm_min_epi16(xy_packed, vqmax), vqmin); in xnn_qs8_requantize_q31__ssse3()
161 const __m128i zw_clamped = _mm_max_epi16(_mm_min_epi16(zw_packed, vqmax), vqmin); in xnn_qs8_requantize_q31__ssse3()
Dq31-sse2.c49 const __m128i vqmax = _mm_set1_epi16((short) qmax); in xnn_qs8_requantize_q31__sse2() local
160 const __m128i xy_clamped = _mm_max_epi16(_mm_min_epi16(xy_packed, vqmax), vqmin); in xnn_qs8_requantize_q31__sse2()
161 const __m128i zw_clamped = _mm_max_epi16(_mm_min_epi16(zw_packed, vqmax), vqmin); in xnn_qs8_requantize_q31__sse2()
Dprecise-sse4.c43 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qs8_requantize_precise__sse4() local
96 const __m128i xyzw_clamped = _mm_max_epi8(_mm_min_epi8(xyzw_packed, vqmax), vqmin); in xnn_qs8_requantize_precise__sse4()
Dq31-sse4.c49 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qs8_requantize_q31__sse4() local
112 const __m128i xyzw_clamped = _mm_max_epi8(_mm_min_epi8(xyzw_packed, vqmax), vqmin); in xnn_qs8_requantize_q31__sse4()
Dq31-wasmsimd.c52 const v128_t vqmax = wasm_i8x16_splat(qmax); in xnn_qs8_requantize_q31__wasmsimd() local
115 const v128_t xyzw_clamped = wasm_i8x16_min(wasm_i8x16_max(xyzw_packed, vqmin), vqmax); in xnn_qs8_requantize_q31__wasmsimd()
Dprecise-neon.c47 const int8x16_t vqmax = vdupq_n_s8(qmax); in xnn_qs8_requantize_precise__neon() local
129 const int8x16_t xyzw_clamped = vmaxq_s8(vminq_s8(xyzw_packed, vqmax), vqmin); in xnn_qs8_requantize_precise__neon()
/external/XNNPACK/src/qu8-requantization/
Dfp32-sse2.c34 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qu8_requantize_fp32__sse2() local
77 const __m128i xyzw_clamped = _mm_max_epu8(_mm_min_epu8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_fp32__sse2()
Dq31-neon.c51 const uint8x16_t vqmax = vdupq_n_u8(qmax); in xnn_qu8_requantize_q31__neon() local
92 const uint8x16_t xyzw_clamped = vmaxq_u8(vminq_u8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_q31__neon()
Dfp32-neon.c35 const uint8x16_t vqmax = vdupq_n_u8(qmax); in xnn_qu8_requantize_fp32__neon() local
77 const uint8x16_t xyzw_clamped = vmaxq_u8(vminq_u8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_fp32__neon()
Dprecise-sse4.c43 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qu8_requantize_precise__sse4() local
96 const __m128i xyzw_clamped = _mm_max_epu8(_mm_min_epu8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_precise__sse4()
Dprecise-ssse3.c43 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qu8_requantize_precise__ssse3() local
104 const __m128i xyzw_clamped = _mm_max_epu8(_mm_min_epu8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_precise__ssse3()
Dq31-sse4.c49 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qu8_requantize_q31__sse4() local
112 const __m128i xyzw_clamped = _mm_max_epu8(_mm_min_epu8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_q31__sse4()
Dprecise-sse2.c43 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qu8_requantize_precise__sse2() local
109 const __m128i xyzw_clamped = _mm_max_epu8(_mm_min_epu8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_precise__sse2()
Dq31-wasmsimd.c52 const v128_t vqmax = wasm_i8x16_splat((int8_t) qmax); in xnn_qu8_requantize_q31__wasmsimd() local
115 const v128_t xyzw_clamped = wasm_u8x16_min(wasm_u8x16_max(xyzw_packed, vqmin), vqmax); in xnn_qu8_requantize_q31__wasmsimd()
Dprecise-neon.c47 const uint8x16_t vqmax = vdupq_n_u8(qmax); in xnn_qu8_requantize_precise__neon() local
129 const uint8x16_t xyzw_clamped = vmaxq_u8(vminq_u8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_precise__neon()
Dq31-ssse3.c49 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qu8_requantize_q31__ssse3() local
161 const __m128i xyzw_clamped = _mm_max_epu8(_mm_min_epu8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_q31__ssse3()
Dq31-sse2.c49 const __m128i vqmax = _mm_set1_epi8((char) qmax); in xnn_qu8_requantize_q31__sse2() local
161 const __m128i xyzw_clamped = _mm_max_epu8(_mm_min_epu8(xyzw_packed, vqmax), vqmin); in xnn_qu8_requantize_q31__sse2()