Home
last modified time | relevance | path

Searched refs:voutOPQRSTUV (Results 1 – 12 of 12) sorted by relevance

/external/XNNPACK/src/qs8-vaddc/gen/
Dminmax-sse41-mul32-ld32-x32.c78 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32() local
83 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32()
88 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32()
91 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32()
Dminmax-xop-mul32-ld32-x32.c83 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32() local
88 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32()
93 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32()
96 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32()
Dminmax-sse41-mul16-ld64-x32.c93 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32() local
98 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32()
103 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32()
106 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32()
Dminmax-sse2-mul16-ld64-x32.c97 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32() local
102 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32()
107 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32()
110 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32()
Dminmax-wasmsimd-x32.c72 …v128_t voutOPQRSTUV = wasm_i16x8_add_saturate(wasm_i16x8_narrow_i32x4(vaccOPQR, vaccSTUV), voutput… in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x32() local
75 v128_t voutGHIJKLMNOPQRSTUV = wasm_i8x16_narrow_i16x8(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x32()
/external/XNNPACK/src/qs8-vadd/gen/
Dminmax-xop-mul32-ld32-x32.c99 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32() local
104 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32()
109 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32()
112 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32()
Dminmax-sse41-mul32-ld32-x32.c94 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32() local
99 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32()
104 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32()
107 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32()
Dminmax-sse41-mul16-ld64-x32.c123 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32() local
128 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32()
133 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32()
136 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32()
Dminmax-sse2-mul16-ld64-x32.c131 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32() local
136 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32()
141 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32()
144 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32()
Dminmax-wasmsimd-x32.c85 …v128_t voutOPQRSTUV = wasm_i16x8_add_saturate(wasm_i16x8_narrow_i32x4(vaccOPQR, vaccSTUV), voutput… in xnn_qs8_vadd_minmax_ukernel__wasmsimd_x32() local
88 v128_t voutGHIJKLMNOPQRSTUV = wasm_i8x16_narrow_i16x8(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__wasmsimd_x32()
/external/XNNPACK/src/f16-spmm/gen/
D32x1-minmax-neonfp16arith.c69 float16x8_t voutOPQRSTUV = vmulq_f16(vaccOPQRSTUV, vscale); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith() local
73 voutOPQRSTUV = vminq_f16(voutOPQRSTUV, vmax); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith()
77 voutOPQRSTUV = vmaxq_f16(voutOPQRSTUV, vmin); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith()
81 vst1q_f16(o + 24, voutOPQRSTUV); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith()
D32x1-minmax-neonfp16arith-x2.c106 float16x8_t voutOPQRSTUV = vmulq_f16(vaccOPQRSTUV, vscale); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2() local
110 voutOPQRSTUV = vminq_f16(voutOPQRSTUV, vmax); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2()
114 voutOPQRSTUV = vmaxq_f16(voutOPQRSTUV, vmin); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2()
118 vst1q_f16(o + 24, voutOPQRSTUV); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2()