Searched refs:_mm512_cvtepi8_epi16 (Results 1 – 16 of 16) sorted by relevance
/external/ruy/ruy/ |
D | pack_avx512.cc | 234 sums_8x4_16bit = _mm512_cvtepi8_epi16(r0_0); 236 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r0_1)); 238 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r1_0)); 240 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r1_1)); 242 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r2_0)); 244 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r2_1)); 246 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r3_0)); 248 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r3_1)); 385 sums_8x4_16bit = _mm512_cvtepi8_epi16(r0_0); 387 _mm512_add_epi16(sums_8x4_16bit, _mm512_cvtepi8_epi16(r0_1)); [all …]
|
D | kernel_avx512.cc | 301 _mm512_cvtepi8_epi16(rhs_data_bottom_lane); 303 _mm512_cvtepi8_epi16(rhs_data_top_lane); 313 _mm512_cvtepi8_epi16(_mm512_cvtepi32_epi16(lhs_data)); 315 const __m512i lhs_16_bit_high = _mm512_cvtepi8_epi16( 745 _mm512_cvtepi8_epi16(_mm512_cvtepi32_epi16(lhs_data)); 747 const __m512i lhs_16_bit_high = _mm512_cvtepi8_epi16(
|
/external/XNNPACK/src/qs8-gemm/gen/ |
D | 1x16c8-minmax-avx512skx.c | 66 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx() 69 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx() 72 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx() 75 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx()
|
D | 2x16c8-minmax-avx512skx.c | 78 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 82 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 86 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 90 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx()
|
D | 3x16c8-minmax-avx512skx.c | 90 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 95 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 100 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 105 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx()
|
D | 4x16c8-minmax-avx512skx.c | 102 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 108 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 114 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 120 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx()
|
/external/XNNPACK/src/qs8-igemm/gen/ |
D | 1x16c8-minmax-avx512skx.c | 75 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx() 78 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx() 81 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx() 84 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx()
|
D | 2x16c8-minmax-avx512skx.c | 89 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 93 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 97 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 101 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx()
|
D | 3x16c8-minmax-avx512skx.c | 103 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 108 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 113 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 118 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx()
|
D | 4x16c8-minmax-avx512skx.c | 117 const __m512i vb0123 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 123 …const __m512i vb4567 = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 32… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 129 …const __m512i vb89AB = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 64… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 135 …const __m512i vbCDEF = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_t) w + 96… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx()
|
/external/XNNPACK/src/qs8-gemm/ |
D | MRx16c8-avx512skx.c.in | 100 … const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); 102 …const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_…
|
/external/XNNPACK/src/qs8-igemm/ |
D | MRx16c8-avx512skx.c.in | 106 … const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) w)); 108 …const __m512i vb${ABC[N:N+4]} = _mm512_cvtepi8_epi16(_mm256_load_si256((const __m256i*) ((uintptr_…
|
/external/llvm-project/clang/lib/Headers/ |
D | avx512bwintrin.h | 1384 _mm512_cvtepi8_epi16(__m256i __A) in _mm512_cvtepi8_epi16() function 1395 (__v32hi)_mm512_cvtepi8_epi16(__A), in _mm512_mask_cvtepi8_epi16() 1403 (__v32hi)_mm512_cvtepi8_epi16(__A), in _mm512_maskz_cvtepi8_epi16()
|
/external/clang/test/CodeGen/ |
D | avx512bw-builtins.c | 1083 return _mm512_cvtepi8_epi16(__A); in test_mm512_cvtepi8_epi16()
|
/external/llvm-project/clang/test/CodeGen/X86/ |
D | avx512bw-builtins.c | 1566 return _mm512_cvtepi8_epi16(__A); in test_mm512_cvtepi8_epi16()
|
/external/clang/lib/Headers/ |
D | avx512bwintrin.h | 1540 _mm512_cvtepi8_epi16 (__m256i __A) in _mm512_cvtepi8_epi16() function
|