Home
last modified time | relevance | path

Searched refs:_mm512_cvtepi8_epi16 (Results 1 – 16 of 16) sorted by relevance

/external/ruy/ruy/
Dpack_avx512.cc234 sums_8x4_16bit = _mm512_cvtepi8_epi16(r0_0);
236 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r0_1));
238 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r1_0));
240 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r1_1));
242 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r2_0));
244 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r2_1));
246 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r3_0));
248 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r3_1));
385 sums_8x4_16bit = _mm512_cvtepi8_epi16(r0_0);
387 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r0_1));
[all …]
Dkernel_avx512.cc301 _mm512_cvtepi8_epi16(rhs_data_bottom_lane);
303 _mm512_cvtepi8_epi16(rhs_data_top_lane);
313 _mm512_cvtepi8_epi16(_mm512_cvtepi32_epi16(lhs_data));
315 const __m512i lhs_16_bit_high = _mm512_cvtepi8_epi16(
745 _mm512_cvtepi8_epi16(_mm512_cvtepi32_epi16(lhs_data));
747 const __m512i lhs_16_bit_high = _mm512_cvtepi8_epi16(
/external/XNNPACK/src/qs8-gemm/gen/
D1x16c8-minmax-avx512skx.c66 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx()
69 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx()
72 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx()
75 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx()
D2x16c8-minmax-avx512skx.c78 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx()
82 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx()
86 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx()
90 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx()
D3x16c8-minmax-avx512skx.c90 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx()
95 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx()
100 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx()
105 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx()
D4x16c8-minmax-avx512skx.c102 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx()
108 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx()
114 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx()
120 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx()
/external/XNNPACK/src/qs8-igemm/gen/
D1x16c8-minmax-avx512skx.c75 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx()
78 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx()
81 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx()
84 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx()
D2x16c8-minmax-avx512skx.c89 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx()
93 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx()
97 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx()
101 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx()
D3x16c8-minmax-avx512skx.c103 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx()
108 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx()
113 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx()
118 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx()
D4x16c8-minmax-avx512skx.c117 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx()
123 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx()
129 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx()
135 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx()
/external/XNNPACK/src/qs8-gemm/
DMRx16c8-avx512skx.c.in100 … const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w));
102 …const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_…
/external/XNNPACK/src/qs8-igemm/
DMRx16c8-avx512skx.c.in106 … const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w));
108 …const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_…
/external/llvm-project/clang/lib/Headers/
Davx512bwintrin.h1384 _mm512_cvtepi8_epi16(__m256i __A) in _mm512_cvtepi8_epi16() function
1395 (__v32hi)_mm512_cvtepi8_epi16(__A), in _mm512_mask_cvtepi8_epi16()
1403 (__v32hi)_mm512_cvtepi8_epi16(__A), in _mm512_maskz_cvtepi8_epi16()
/external/clang/test/CodeGen/
Davx512bw-builtins.c1083 return _mm512_cvtepi8_epi16(__A); in test_mm512_cvtepi8_epi16()
/external/llvm-project/clang/test/CodeGen/X86/
Davx512bw-builtins.c1566 return _mm512_cvtepi8_epi16(__A); in test_mm512_cvtepi8_epi16()
/external/clang/lib/Headers/
Davx512bwintrin.h1540 _mm512_cvtepi8_epi16 (__m256i __A) in _mm512_cvtepi8_epi16() function