Searched refs:_mm512_rsqrt14_ps (Results 1 – 18 of 18) sorted by relevance
40 const __m512 vrsqrtx0 = _mm512_rsqrt14_ps(vx0); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()41 const __m512 vrsqrtx1 = _mm512_rsqrt14_ps(vx1); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()42 const __m512 vrsqrtx2 = _mm512_rsqrt14_ps(vx2); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()43 const __m512 vrsqrtx3 = _mm512_rsqrt14_ps(vx3); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()44 const __m512 vrsqrtx4 = _mm512_rsqrt14_ps(vx4); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()45 const __m512 vrsqrtx5 = _mm512_rsqrt14_ps(vx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()46 const __m512 vrsqrtx6 = _mm512_rsqrt14_ps(vx6); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()47 const __m512 vrsqrtx7 = _mm512_rsqrt14_ps(vx7); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()124 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()144 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x128()
39 const __m512 vrsqrtx0 = _mm512_rsqrt14_ps(vx0); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()40 const __m512 vrsqrtx1 = _mm512_rsqrt14_ps(vx1); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()41 const __m512 vrsqrtx2 = _mm512_rsqrt14_ps(vx2); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()42 const __m512 vrsqrtx3 = _mm512_rsqrt14_ps(vx3); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()43 const __m512 vrsqrtx4 = _mm512_rsqrt14_ps(vx4); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()44 const __m512 vrsqrtx5 = _mm512_rsqrt14_ps(vx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()45 const __m512 vrsqrtx6 = _mm512_rsqrt14_ps(vx6); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()114 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()134 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x112()
38 const __m512 vrsqrtx0 = _mm512_rsqrt14_ps(vx0); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()39 const __m512 vrsqrtx1 = _mm512_rsqrt14_ps(vx1); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()40 const __m512 vrsqrtx2 = _mm512_rsqrt14_ps(vx2); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()41 const __m512 vrsqrtx3 = _mm512_rsqrt14_ps(vx3); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()42 const __m512 vrsqrtx4 = _mm512_rsqrt14_ps(vx4); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()43 const __m512 vrsqrtx5 = _mm512_rsqrt14_ps(vx5); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()104 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()124 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x96()
37 const __m512 vrsqrtx0 = _mm512_rsqrt14_ps(vx0); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80()38 const __m512 vrsqrtx1 = _mm512_rsqrt14_ps(vx1); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80()39 const __m512 vrsqrtx2 = _mm512_rsqrt14_ps(vx2); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80()40 const __m512 vrsqrtx3 = _mm512_rsqrt14_ps(vx3); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80()41 const __m512 vrsqrtx4 = _mm512_rsqrt14_ps(vx4); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80()94 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80()114 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x80()
36 const __m512 vrsqrtx0 = _mm512_rsqrt14_ps(vx0); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64()37 const __m512 vrsqrtx1 = _mm512_rsqrt14_ps(vx1); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64()38 const __m512 vrsqrtx2 = _mm512_rsqrt14_ps(vx2); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64()39 const __m512 vrsqrtx3 = _mm512_rsqrt14_ps(vx3); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64()84 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64()104 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x64()
35 const __m512 vrsqrtx0 = _mm512_rsqrt14_ps(vx0); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48()36 const __m512 vrsqrtx1 = _mm512_rsqrt14_ps(vx1); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48()37 const __m512 vrsqrtx2 = _mm512_rsqrt14_ps(vx2); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48()74 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48()94 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x48()
34 const __m512 vrsqrtx0 = _mm512_rsqrt14_ps(vx0); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x32()35 const __m512 vrsqrtx1 = _mm512_rsqrt14_ps(vx1); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x32()64 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x32()84 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x32()
33 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x16()53 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_f32_vsqrt_ukernel__avx512f_nr1fma1adj_x16()
37 const __m512 vrsqrtx${ABC[N]} = _mm512_rsqrt14_ps(vx${ABC[N]});65 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx);85 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx);
28 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_math_f32_sqrt__avx512f_nr1fma()
28 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_math_f32_sqrt__avx512f_nr2fma()
28 const __m512 vrsqrtx = _mm512_rsqrt14_ps(vx); in xnn_math_f32_sqrt__avx512f_nr1fma1adj()
269 Packet16f x = _mm512_mask_blend_ps(non_zero_mask, _mm512_rsqrt14_ps(_x),337 _mm512_rsqrt14_ps(_x));
150 SIMD_WRAPPER_1_(rsqrt_ps, _mm512_rsqrt14_ps); // return 1.0f / sqrt(a)
117 return _mm512_rsqrt14_ps(a); in test_mm512_rsqrt14_ps()
131 return _mm512_rsqrt14_ps(a); in test_mm512_rsqrt14_ps()
1594 _mm512_rsqrt14_ps(__m512 __A) in _mm512_rsqrt14_ps() function
1585 _mm512_rsqrt14_ps(__m512 __A) in _mm512_rsqrt14_ps() function