/external/XNNPACK/src/qs8-vaddc/gen/ |
D | minmax-sse41-mul32-ld32-x32.c | 78 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32() local 83 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32() 88 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32() 91 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul32_ld32_x32()
|
D | minmax-xop-mul32-ld32-x32.c | 83 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32() local 88 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32() 93 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32() 96 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__xop_mul32_ld32_x32()
|
D | minmax-sse41-mul16-ld64-x32.c | 93 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32() local 98 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32() 103 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32() 106 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__sse41_mul16_ld64_x32()
|
D | minmax-sse2-mul16-ld64-x32.c | 97 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32() local 102 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32() 107 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32() 110 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__sse2_mul16_ld64_x32()
|
D | minmax-wasmsimd-x32.c | 72 …v128_t voutOPQRSTUV = wasm_i16x8_add_saturate(wasm_i16x8_narrow_i32x4(vaccOPQR, vaccSTUV), voutput… in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x32() local 75 v128_t voutGHIJKLMNOPQRSTUV = wasm_i8x16_narrow_i16x8(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vaddc_minmax_ukernel__wasmsimd_x32()
|
/external/XNNPACK/src/qs8-vadd/gen/ |
D | minmax-xop-mul32-ld32-x32.c | 99 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32() local 104 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32() 109 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32() 112 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__xop_mul32_ld32_x32()
|
D | minmax-sse41-mul32-ld32-x32.c | 94 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32() local 99 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32() 104 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32() 107 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__sse41_mul32_ld32_x32()
|
D | minmax-sse41-mul16-ld64-x32.c | 123 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32() local 128 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32() 133 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32() 136 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__sse41_mul16_ld64_x32()
|
D | minmax-sse2-mul16-ld64-x32.c | 131 __m128i voutOPQRSTUV = _mm_adds_epi16(_mm_packs_epi32(vaccOPQR, vaccSTUV), voutput_zero_point); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32() local 136 voutOPQRSTUV = _mm_max_epi16(voutOPQRSTUV, voutput_min); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32() 141 voutOPQRSTUV = _mm_min_epi16(voutOPQRSTUV, voutput_max); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32() 144 const __m128i voutGHIJKLMNOPQRSTUV = _mm_packs_epi16(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__sse2_mul16_ld64_x32()
|
D | minmax-wasmsimd-x32.c | 85 …v128_t voutOPQRSTUV = wasm_i16x8_add_saturate(wasm_i16x8_narrow_i32x4(vaccOPQR, vaccSTUV), voutput… in xnn_qs8_vadd_minmax_ukernel__wasmsimd_x32() local 88 v128_t voutGHIJKLMNOPQRSTUV = wasm_i8x16_narrow_i16x8(voutGHIJKLMN, voutOPQRSTUV); in xnn_qs8_vadd_minmax_ukernel__wasmsimd_x32()
|
/external/XNNPACK/src/f16-spmm/gen/ |
D | 32x1-minmax-neonfp16arith.c | 69 float16x8_t voutOPQRSTUV = vmulq_f16(vaccOPQRSTUV, vscale); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith() local 73 voutOPQRSTUV = vminq_f16(voutOPQRSTUV, vmax); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith() 77 voutOPQRSTUV = vmaxq_f16(voutOPQRSTUV, vmin); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith() 81 vst1q_f16(o + 24, voutOPQRSTUV); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith()
|
D | 32x1-minmax-neonfp16arith-x2.c | 106 float16x8_t voutOPQRSTUV = vmulq_f16(vaccOPQRSTUV, vscale); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2() local 110 voutOPQRSTUV = vminq_f16(voutOPQRSTUV, vmax); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2() 114 voutOPQRSTUV = vmaxq_f16(voutOPQRSTUV, vmin); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2() 118 vst1q_f16(o + 24, voutOPQRSTUV); in xnn_f16_spmm_minmax_ukernel_32x1__neonfp16arith_x2()
|