/external/XNNPACK/src/qs8-gemm/gen/ |
D | 4x16c8-minmax-avx512skx.c | 150 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 151 …const __m512i vprod1x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc1x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 152 …const __m512i vprod2x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc2x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 153 …const __m512i vprod3x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc3x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 155 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 156 …const __m512i vprod1x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc1x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 157 …const __m512i vprod2x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc2x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 158 …const __m512i vprod3x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc3x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 161 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() 163 const __m512i vq31prod1x8C9DAEBF = _mm512_add_epi64(vprod1x8C9DAEBF, vprod1x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_4x16c8__avx512skx() [all …]
|
D | 3x16c8-minmax-avx512skx.c | 130 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 131 …const __m512i vprod1x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc1x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 132 …const __m512i vprod2x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc2x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 134 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 135 …const __m512i vprod1x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc1x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 136 …const __m512i vprod2x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc2x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 139 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 141 const __m512i vq31prod1x8C9DAEBF = _mm512_add_epi64(vprod1x8C9DAEBF, vprod1x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx() 143 const __m512i vq31prod2x8C9DAEBF = _mm512_add_epi64(vprod2x8C9DAEBF, vprod2x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_3x16c8__avx512skx()
|
D | 2x16c8-minmax-avx512skx.c | 110 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 111 …const __m512i vprod1x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc1x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 113 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 114 …const __m512i vprod1x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc1x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 117 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx() 119 const __m512i vq31prod1x8C9DAEBF = _mm512_add_epi64(vprod1x8C9DAEBF, vprod1x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_2x16c8__avx512skx()
|
D | 1x16c8-minmax-avx512skx.c | 90 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx() 92 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx() 95 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_gemm_minmax_ukernel_1x16c8__avx512skx()
|
/external/XNNPACK/src/qs8-igemm/gen/ |
D | 4x16c8-minmax-avx512skx.c | 167 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 168 …const __m512i vprod1x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc1x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 169 …const __m512i vprod2x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc2x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 170 …const __m512i vprod3x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc3x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 172 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 173 …const __m512i vprod1x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc1x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 174 …const __m512i vprod2x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc2x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 175 …const __m512i vprod3x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc3x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 178 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() 180 const __m512i vq31prod1x8C9DAEBF = _mm512_add_epi64(vprod1x8C9DAEBF, vprod1x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_4x16c8__avx512skx() [all …]
|
D | 3x16c8-minmax-avx512skx.c | 145 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 146 …const __m512i vprod1x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc1x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 147 …const __m512i vprod2x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc2x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 149 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 150 …const __m512i vprod1x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc1x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 151 …const __m512i vprod2x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc2x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 154 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 156 const __m512i vq31prod1x8C9DAEBF = _mm512_add_epi64(vprod1x8C9DAEBF, vprod1x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx() 158 const __m512i vq31prod2x8C9DAEBF = _mm512_add_epi64(vprod2x8C9DAEBF, vprod2x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_3x16c8__avx512skx()
|
D | 2x16c8-minmax-avx512skx.c | 123 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 124 …const __m512i vprod1x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc1x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 126 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 127 …const __m512i vprod1x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc1x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 130 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx() 132 const __m512i vq31prod1x8C9DAEBF = _mm512_add_epi64(vprod1x8C9DAEBF, vprod1x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_2x16c8__avx512skx()
|
D | 1x16c8-minmax-avx512skx.c | 101 …const __m512i vprod0x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc0x084C195D2A6E3B7F, vmultipl… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx() 103 …const __m512i vprod0x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc0x88CC99DDAAEEBBFF, vmultipl… in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx() 106 const __m512i vq31prod0x8C9DAEBF = _mm512_add_epi64(vprod0x8C9DAEBF, vprod0x8C9DAEBF); in xnn_qs8_igemm_minmax_ukernel_1x16c8__avx512skx()
|
/external/XNNPACK/src/qs8-dwconv/gen/ |
D | up32x9-minmax-avx512skx-mul32.c | 185 …const __m512i vprod02468ACE = _mm512_add_epi64(_mm512_mul_epi32(vacc0123456789ABCDEF, vmultiplier)… in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 186 …const __m512i vprod13579BDF = _mm512_add_epi64(_mm512_mul_epi32(vacc13579BDF, vmultiplier), vround… in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 187 …const __m512i vprodGIKMOQSU = _mm512_add_epi64(_mm512_mul_epi32(vaccGHIJKLMNOPQRSTUV, vmultiplier)… in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 188 …const __m512i vprodHJLNPRTV = _mm512_add_epi64(_mm512_mul_epi32(vaccHJLNPRTV, vmultiplier), vround… in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 191 const __m512i vq31prod13579BDF = _mm512_add_epi64(vprod13579BDF, vprod13579BDF); in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 193 const __m512i vq31prodHJLNPRTV = _mm512_add_epi64(vprodHJLNPRTV, vprodHJLNPRTV); in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 295 …const __m512i vprod02468ACE = _mm512_add_epi64(_mm512_mul_epi32(vacc0123456789ABCDEF, vmultiplier)… in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 296 …const __m512i vprod13579BDF = _mm512_add_epi64(_mm512_mul_epi32(vacc13579BDF, vmultiplier), vround… in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32() 299 const __m512i vq31prod13579BDF = _mm512_add_epi64(vprod13579BDF, vprod13579BDF); in xnn_qs8_dwconv_minmax_ukernel_up32x9__avx512skx_mul32()
|
D | up16x9-minmax-avx512skx-mul32.c | 155 …const __m512i vprod02468ACE = _mm512_add_epi64(_mm512_mul_epi32(vacc0123456789ABCDEF, vmultiplier)… in xnn_qs8_dwconv_minmax_ukernel_up16x9__avx512skx_mul32() 156 …const __m512i vprod13579BDF = _mm512_add_epi64(_mm512_mul_epi32(vacc13579BDF, vmultiplier), vround… in xnn_qs8_dwconv_minmax_ukernel_up16x9__avx512skx_mul32() 159 const __m512i vq31prod13579BDF = _mm512_add_epi64(vprod13579BDF, vprod13579BDF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__avx512skx_mul32() 237 …const __m512i vprod02468ACE = _mm512_add_epi64(_mm512_mul_epi32(vacc0123456789ABCDEF, vmultiplier)… in xnn_qs8_dwconv_minmax_ukernel_up16x9__avx512skx_mul32() 238 …const __m512i vprod13579BDF = _mm512_add_epi64(_mm512_mul_epi32(vacc13579BDF, vmultiplier), vround… in xnn_qs8_dwconv_minmax_ukernel_up16x9__avx512skx_mul32() 241 const __m512i vq31prod13579BDF = _mm512_add_epi64(vprod13579BDF, vprod13579BDF); in xnn_qs8_dwconv_minmax_ukernel_up16x9__avx512skx_mul32()
|
/external/XNNPACK/src/qs8-dwconv/ |
D | unipass-avx512skx-mul32.c.in | 84 …const __m512i vprod${ABC[C:C+16:2]} = _mm512_add_epi64(_mm512_mul_epi32(vacc${ABC[C:C+16]}, vmulti… 85 …const __m512i vprod${ABC[C+1:C+16:2]} = _mm512_add_epi64(_mm512_mul_epi32(vacc${ABC[C+1:C+16:2]}, … 89 …const __m512i vq31prod${ABC[C+1:C+16:2]} = _mm512_add_epi64(vprod${ABC[C+1:C+16:2]}, vprod${ABC[C+… 172 …const __m512i vprod${ABC[0:16:2]} = _mm512_add_epi64(_mm512_mul_epi32(vacc${ABC[0:16]}, vmultiplie… 173 …const __m512i vprod${ABC[1:16:2]} = _mm512_add_epi64(_mm512_mul_epi32(vacc${ABC[1:16:2]}, vmultipl… 176 … const __m512i vq31prod${ABC[1:16:2]} = _mm512_add_epi64(vprod${ABC[1:16:2]}, vprod${ABC[1:16:2]});
|
/external/XNNPACK/src/qs8-gemm/ |
D | MRx16c8-avx512skx.c.in | 125 …const __m512i vprod${M}x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc${M}x084C195D2A6E3B7F, vm… 128 …const __m512i vprod${M}x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc${M}x88CC99DDAAEEBBFF, vm… 132 … const __m512i vq31prod${M}x8C9DAEBF = _mm512_add_epi64(vprod${M}x8C9DAEBF, vprod${M}x8C9DAEBF);
|
/external/XNNPACK/src/qs8-igemm/ |
D | MRx16c8-avx512skx.c.in | 133 …const __m512i vprod${M}x04152637 = _mm512_add_epi64(_mm512_mul_epi32(vacc${M}x084C195D2A6E3B7F, vm… 136 …const __m512i vprod${M}x8C9DAEBF = _mm512_add_epi64(_mm512_mul_epi32(vacc${M}x88CC99DDAAEEBBFF, vm… 140 … const __m512i vq31prod${M}x8C9DAEBF = _mm512_add_epi64(vprod${M}x8C9DAEBF, vprod${M}x8C9DAEBF);
|
/external/ruy/ruy/ |
D | kernel_avx512.cc | 402 const __m512i r_plus_nudge = _mm512_add_epi64(results, nudge); 443 scaled_v_low = _mm512_add_epi64(scaled_v_low, offset_vector_val); 444 scaled_v_high = _mm512_add_epi64(scaled_v_high, offset_vector_val); 485 scaled_v_low = _mm512_add_epi64(scaled_v_low, offset_vector); 486 scaled_v_high = _mm512_add_epi64(scaled_v_high, offset_vector); 813 const __m512i r_plus_nudge = _mm512_add_epi64(results, nudge); 840 scaled_v_low = _mm512_add_epi64(scaled_v_low, offset_vector); 841 scaled_v_high = _mm512_add_epi64(scaled_v_high, offset_vector);
|
/external/llvm-project/clang/lib/Headers/ |
D | avx512fintrin.h | 852 _mm512_add_epi64 (__m512i __A, __m512i __B) in _mm512_add_epi64() function 861 (__v8di)_mm512_add_epi64(__A, __B), in _mm512_mask_add_epi64() 869 (__v8di)_mm512_add_epi64(__A, __B), in _mm512_maskz_add_epi64()
|
/external/clang/test/CodeGen/ |
D | avx512f-builtins.c | 1661 return _mm512_add_epi64(__A,__B); in test_mm512_add_epi64()
|
/external/llvm-project/clang/test/CodeGen/X86/ |
D | avx512f-builtins.c | 2988 return _mm512_add_epi64(__A,__B); in test_mm512_add_epi64()
|
/external/clang/lib/Headers/ |
D | avx512fintrin.h | 734 _mm512_add_epi64 (__m512i __A, __m512i __B) in _mm512_add_epi64() function
|