Home
last modified time | relevance | path

Searched refs:_mm512_fmsub_ps (Results 1 – 22 of 22) sorted by relevance

/external/XNNPACK/src/f32-velu/gen/
Dvelu-avx512f-rr1-lut16-p3-perm-x128.c140 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
141 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
142 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
143 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
144 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
145 vs5 = _mm512_fmsub_ps(vs5, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
146 vs6 = _mm512_fmsub_ps(vs6, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
147 vs7 = _mm512_fmsub_ps(vs7, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
214 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
247 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x128()
Dvelu-avx512f-rr1-lut16-p3-perm-x112.c129 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
130 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
131 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
132 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
133 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
134 vs5 = _mm512_fmsub_ps(vs5, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
135 vs6 = _mm512_fmsub_ps(vs6, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
197 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
230 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x112()
Dvelu-avx512f-rr1-p6-x128.c150 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
151 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
152 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
153 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
154 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
155 vs5 = _mm512_fmsub_ps(vs5, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
156 vs6 = _mm512_fmsub_ps(vs6, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
157 vs7 = _mm512_fmsub_ps(vs7, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
225 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
259 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x128()
Dvelu-avx512f-rr1-lut16-p3-perm-x80.c107 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x80()
108 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x80()
109 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x80()
110 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x80()
111 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x80()
163 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x80()
196 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x80()
Dvelu-avx512f-rr1-lut16-p3-perm-x96.c118 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
119 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
120 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
121 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
122 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
123 vs5 = _mm512_fmsub_ps(vs5, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
180 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
213 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x96()
Dvelu-avx512f-rr1-p6-x96.c126 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
127 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
128 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
129 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
130 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
131 vs5 = _mm512_fmsub_ps(vs5, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
189 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
223 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x96()
Dvelu-avx512f-rr1-p6-x112.c138 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
139 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
140 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
141 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
142 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
143 vs5 = _mm512_fmsub_ps(vs5, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
144 vs6 = _mm512_fmsub_ps(vs6, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
207 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
241 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x112()
Dvelu-avx512f-rr1-p6-x80.c114 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x80()
115 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x80()
116 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x80()
117 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x80()
118 vs4 = _mm512_fmsub_ps(vs4, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x80()
171 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x80()
205 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x80()
Dvelu-avx512f-rr1-p6-x64.c102 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x64()
103 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x64()
104 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x64()
105 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x64()
153 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x64()
187 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x64()
Dvelu-avx512f-rr1-lut16-p3-perm-x64.c96 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x64()
97 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x64()
98 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x64()
99 vs3 = _mm512_fmsub_ps(vs3, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x64()
146 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x64()
179 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x64()
Dvelu-avx512f-rr1-lut16-p3-perm-x48.c85 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x48()
86 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x48()
87 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x48()
129 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x48()
162 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x48()
Dvelu-avx512f-rr1-p6-x48.c90 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x48()
91 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x48()
92 vs2 = _mm512_fmsub_ps(vs2, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x48()
135 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x48()
169 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x48()
Dvelu-avx512f-rr1-lut16-p3-perm-x32.c74 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x32()
75 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x32()
112 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x32()
145 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x32()
Dvelu-avx512f-rr1-p6-x32.c78 vs0 = _mm512_fmsub_ps(vs0, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x32()
79 vs1 = _mm512_fmsub_ps(vs1, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x32()
117 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x32()
151 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x32()
Dvelu-avx512f-rr1-lut16-p3-perm-x16.c61 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x16()
94 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_lut16_p3_perm_x16()
Dvelu-avx512f-rr1-p6-x16.c62 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x16()
96 vs = _mm512_fmsub_ps(vs, valpha, valpha); in xnn_f32_velu_ukernel__avx512f_rr1_p6_x16()
/external/XNNPACK/src/f32-velu/
Davx512f-rr1-lut16-p3-perm.c.in73 vs${N} = _mm512_fmsub_ps(vs${N}, valpha, valpha);
110 vs = _mm512_fmsub_ps(vs, valpha, valpha);
143 vs = _mm512_fmsub_ps(vs, valpha, valpha);
Davx512f-rr1-p6.c.in78 vs${N} = _mm512_fmsub_ps(vs${N}, valpha, valpha);
116 vs = _mm512_fmsub_ps(vs, valpha, valpha);
150 vs = _mm512_fmsub_ps(vs, valpha, valpha);
/external/clang/test/CodeGen/
Davx512f-builtins.c641 return _mm512_fmsub_ps(__A, __B, __C); in test_mm512_fmsub_ps()
/external/llvm-project/clang/test/CodeGen/X86/
Davx512f-builtins.c784 return _mm512_fmsub_ps(__A, __B, __C); in test_mm512_fmsub_ps()
/external/clang/lib/Headers/
Davx512fintrin.h2889 _mm512_fmsub_ps(__m512 __A, __m512 __B, __m512 __C) in _mm512_fmsub_ps() function
/external/llvm-project/clang/lib/Headers/
Davx512fintrin.h2756 _mm512_fmsub_ps(__m512 __A, __m512 __B, __m512 __C) in _mm512_fmsub_ps() function