Home
last modified time | relevance | path

Searched refs:_mm512_rcp14_ps (Results 1 – 25 of 46) sorted by relevance

12

/external/XNNPACK/src/f32-sigmoid/gen/
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x128.c150 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
151 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
152 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
153 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
154 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
155 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
156 __m512 vr6 = _mm512_rcp14_ps(vd6); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
157 __m512 vr7 = _mm512_rcp14_ps(vd7); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
217 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
252 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x128()
Davx512f-rr1-p5-scalef-nr1fma-x128.c147 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
148 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
149 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
150 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
151 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
152 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
153 __m512 vr6 = _mm512_rcp14_ps(vd6); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
154 __m512 vr7 = _mm512_rcp14_ps(vd7); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
213 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
247 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x128()
Davx512f-rr1-p5-scalef-nr1fma-x96.c123 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
124 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
125 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
126 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
127 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
128 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
179 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
213 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x96()
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x112.c138 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
139 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
140 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
141 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
142 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
143 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
144 __m512 vr6 = _mm512_rcp14_ps(vd6); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
200 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
235 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x112()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x112.c144 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
145 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
146 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
147 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
148 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
149 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
150 __m512 vr6 = _mm512_rcp14_ps(vd6); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
206 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
241 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x112()
Davx512f-rr1-p5-scalef-nr1fma-x112.c135 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
136 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
137 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
138 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
139 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
140 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
141 __m512 vr6 = _mm512_rcp14_ps(vd6); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
196 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
230 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x112()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x128.c156 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
157 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
158 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
159 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
160 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
161 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
162 __m512 vr6 = _mm512_rcp14_ps(vd6); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
163 __m512 vr7 = _mm512_rcp14_ps(vd7); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
223 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
258 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x128()
Davx512f-rr1-p5-scalef-nr1fma-x64.c99 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x64()
100 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x64()
101 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x64()
102 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x64()
145 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x64()
179 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x64()
Davx512f-rr1-p5-scalef-nr1fma-x80.c111 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x80()
112 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x80()
113 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x80()
114 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x80()
115 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x80()
162 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x80()
196 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x80()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x80.c120 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x80()
121 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x80()
122 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x80()
123 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x80()
124 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x80()
172 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x80()
207 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x80()
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x80.c114 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x80()
115 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x80()
116 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x80()
117 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x80()
118 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x80()
166 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x80()
201 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x80()
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x96.c126 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
127 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
128 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
129 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
130 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
131 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
183 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
218 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x96()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x96.c132 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
133 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
134 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
135 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
136 __m512 vr4 = _mm512_rcp14_ps(vd4); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
137 __m512 vr5 = _mm512_rcp14_ps(vd5); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
189 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
224 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x96()
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x64.c102 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x64()
103 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x64()
104 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x64()
105 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x64()
149 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x64()
184 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x64()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x64.c108 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x64()
109 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x64()
110 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x64()
111 __m512 vr3 = _mm512_rcp14_ps(vd3); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x64()
155 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x64()
190 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x64()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x48.c96 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x48()
97 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x48()
98 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x48()
138 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x48()
173 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x48()
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x48.c90 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x48()
91 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x48()
92 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x48()
132 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x48()
167 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x48()
Davx512f-rr1-p5-scalef-nr1fma-x48.c87 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x48()
88 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x48()
89 __m512 vr2 = _mm512_rcp14_ps(vd2); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x48()
128 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x48()
162 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x48()
Davx512f-rr1-p5-scalef-nr1fma-x32.c75 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x32()
76 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x32()
111 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x32()
145 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x32()
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x32.c78 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x32()
79 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x32()
115 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x32()
150 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x32()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x32.c84 __m512 vr0 = _mm512_rcp14_ps(vd0); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x32()
85 __m512 vr1 = _mm512_rcp14_ps(vd1); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x32()
121 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x32()
156 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x32()
Davx512f-rr2-lut32-p2-perm2-scalef-nr1fma-x16.c66 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x16()
101 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr2_lut32_p2_perm2_scalef_nr1fma_x16()
Davx512f-rr1-lut16-p3-perm-scalef-nr1fma-x16.c60 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x16()
95 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_lut16_p3_perm_scalef_nr1fma_x16()
Davx512f-rr1-p5-scalef-nr1fma-x16.c56 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x16()
90 __m512 vr = _mm512_rcp14_ps(vd); in xnn_f32_sigmoid_ukernel__avx512f_rr1_p5_scalef_nr1fma_x16()
/external/XNNPACK/src/f32-sigmoid/
Davx512f-p5-scalef.c.in95 __m512 vr${ABC[N]} = _mm512_rcp14_ps(vd${ABC[N]});
141 __m512 vr = _mm512_rcp14_ps(vd);
184 __m512 vr = _mm512_rcp14_ps(vd);

12