Lines Matching refs:params

53   union xnn_qu8_gemm_params params;  in xnn_init_scalar_qu8_gemm_params()  local
54 params.scalar.kernel_zero_point = (int32_t) (uint32_t) kernel_zero_point; in xnn_init_scalar_qu8_gemm_params()
55 params.scalar.multiplier = multiplier; in xnn_init_scalar_qu8_gemm_params()
56 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_scalar_qu8_gemm_params()
57 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_scalar_qu8_gemm_params()
58 params.scalar.shift = (uint32_t) shift; in xnn_init_scalar_qu8_gemm_params()
59 params.scalar.output_min_less_zero_point = in xnn_init_scalar_qu8_gemm_params()
61 params.scalar.output_max_less_zero_point = in xnn_init_scalar_qu8_gemm_params()
63 params.scalar.output_zero_point = (int32_t) (uint32_t) output_zero_point; in xnn_init_scalar_qu8_gemm_params()
64 return params; in xnn_init_scalar_qu8_gemm_params()
87 union xnn_qu8_gemm_params params; in xnn_init_qu8_gemm_params() local
92 params.sse2.kernel_zero_point[i] = (int16_t) (uint16_t) kernel_zero_point; in xnn_init_qu8_gemm_params()
94 params.sse2.multiplier[0] = multiplier; in xnn_init_qu8_gemm_params()
95 params.sse2.multiplier[1] = multiplier; in xnn_init_qu8_gemm_params()
96 params.sse2.multiplier[2] = multiplier; in xnn_init_qu8_gemm_params()
97 params.sse2.multiplier[3] = multiplier; in xnn_init_qu8_gemm_params()
98 params.sse2.rounding[0] = UINT64_C(0x40000000); in xnn_init_qu8_gemm_params()
99 params.sse2.rounding[1] = UINT64_C(0x40000000); in xnn_init_qu8_gemm_params()
100 params.sse2.remainder_mask[0] = (int32_t) remainder_mask; in xnn_init_qu8_gemm_params()
101 params.sse2.remainder_mask[1] = (int32_t) remainder_mask; in xnn_init_qu8_gemm_params()
102 params.sse2.remainder_mask[2] = (int32_t) remainder_mask; in xnn_init_qu8_gemm_params()
103 params.sse2.remainder_mask[3] = (int32_t) remainder_mask; in xnn_init_qu8_gemm_params()
104 params.sse2.remainder_threshold[0] = (int32_t) remainder_threshold; in xnn_init_qu8_gemm_params()
105 params.sse2.remainder_threshold[1] = (int32_t) remainder_threshold; in xnn_init_qu8_gemm_params()
106 params.sse2.remainder_threshold[2] = (int32_t) remainder_threshold; in xnn_init_qu8_gemm_params()
107 params.sse2.remainder_threshold[3] = (int32_t) remainder_threshold; in xnn_init_qu8_gemm_params()
108 params.sse2.shift[0] = (uint64_t) (uint32_t) shift; in xnn_init_qu8_gemm_params()
109 params.sse2.shift[1] = (uint64_t) (uint32_t) shift; in xnn_init_qu8_gemm_params()
111 params.sse2.output_zero_point[i] = (int16_t) (uint16_t) output_zero_point; in xnn_init_qu8_gemm_params()
114 params.sse2.output_min[i] = output_min; in xnn_init_qu8_gemm_params()
115 params.sse2.output_max[i] = output_max; in xnn_init_qu8_gemm_params()
118 params.neon.kernel_zero_point = (int32_t) (uint32_t) kernel_zero_point; in xnn_init_qu8_gemm_params()
119 params.neon.multiplier = multiplier; in xnn_init_qu8_gemm_params()
120 params.neon.right_shift = -shift; in xnn_init_qu8_gemm_params()
121 params.neon.output_zero_point = (int16_t) (uint16_t) output_zero_point; in xnn_init_qu8_gemm_params()
122 params.neon.output_min = output_min; in xnn_init_qu8_gemm_params()
123 params.neon.output_max = output_max; in xnn_init_qu8_gemm_params()
127 params.scalar.kernel_zero_point = (int32_t) (uint32_t) kernel_zero_point; in xnn_init_qu8_gemm_params()
128 params.scalar.multiplier = multiplier; in xnn_init_qu8_gemm_params()
129 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_qu8_gemm_params()
130 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_qu8_gemm_params()
131 params.scalar.shift = (uint32_t) shift; in xnn_init_qu8_gemm_params()
132 params.scalar.output_min_less_zero_point = in xnn_init_qu8_gemm_params()
134 params.scalar.output_max_less_zero_point = in xnn_init_qu8_gemm_params()
136 params.scalar.output_zero_point = (int32_t) (uint32_t) output_zero_point; in xnn_init_qu8_gemm_params()
138 return params; in xnn_init_qu8_gemm_params()
163 union xnn_qs8_gemm_params params; in xnn_init_scalar_qs8_gemm_params() local
164 params.scalar.multiplier = multiplier; in xnn_init_scalar_qs8_gemm_params()
165 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_scalar_qs8_gemm_params()
166 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_scalar_qs8_gemm_params()
167 params.scalar.shift = (uint32_t) shift; in xnn_init_scalar_qs8_gemm_params()
168 params.scalar.output_min_less_zero_point = (int32_t) output_min - (int32_t) output_zero_point; in xnn_init_scalar_qs8_gemm_params()
169 params.scalar.output_max_less_zero_point = (int32_t) output_max - (int32_t) output_zero_point; in xnn_init_scalar_qs8_gemm_params()
170 params.scalar.output_zero_point = (int32_t) output_zero_point; in xnn_init_scalar_qs8_gemm_params()
171 return params; in xnn_init_scalar_qs8_gemm_params()
193 union xnn_qs8_gemm_params params; in xnn_init_qs8_gemm_params() local
197 params.sse2.multiplier[0] = multiplier; in xnn_init_qs8_gemm_params()
198 params.sse2.multiplier[1] = multiplier; in xnn_init_qs8_gemm_params()
199 params.sse2.multiplier[2] = multiplier; in xnn_init_qs8_gemm_params()
200 params.sse2.multiplier[3] = multiplier; in xnn_init_qs8_gemm_params()
201 params.sse2.rounding[0] = UINT64_C(0x40000000); in xnn_init_qs8_gemm_params()
202 params.sse2.rounding[1] = UINT64_C(0x40000000); in xnn_init_qs8_gemm_params()
203 params.sse2.remainder_mask[0] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
204 params.sse2.remainder_mask[1] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
205 params.sse2.remainder_mask[2] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
206 params.sse2.remainder_mask[3] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
207 params.sse2.remainder_threshold[0] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
208 params.sse2.remainder_threshold[1] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
209 params.sse2.remainder_threshold[2] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
210 params.sse2.remainder_threshold[3] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
211 params.sse2.shift[0] = (uint64_t) (uint32_t) shift; in xnn_init_qs8_gemm_params()
212 params.sse2.shift[1] = (uint64_t) (uint32_t) shift; in xnn_init_qs8_gemm_params()
214 params.sse2.output_zero_point[i] = (int16_t) output_zero_point; in xnn_init_qs8_gemm_params()
215 params.sse2.output_min[i] = (int16_t) output_min; in xnn_init_qs8_gemm_params()
216 params.sse2.output_max[i] = (int16_t) output_max; in xnn_init_qs8_gemm_params()
219 params.neon.multiplier = multiplier; in xnn_init_qs8_gemm_params()
220 params.neon.right_shift = -shift; in xnn_init_qs8_gemm_params()
221 params.neon.output_zero_point = (int16_t) output_zero_point; in xnn_init_qs8_gemm_params()
222 params.neon.output_min = output_min; in xnn_init_qs8_gemm_params()
223 params.neon.output_max = output_max; in xnn_init_qs8_gemm_params()
228 params.wasmsimd.multiplier[0] = twice_multiplier; in xnn_init_qs8_gemm_params()
229 params.wasmsimd.multiplier[1] = twice_multiplier; in xnn_init_qs8_gemm_params()
230 params.wasmsimd.rounding[0] = INT64_C(0x80000000); in xnn_init_qs8_gemm_params()
231 params.wasmsimd.rounding[1] = INT64_C(0x80000000); in xnn_init_qs8_gemm_params()
232 params.wasmsimd.remainder_mask[0] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
233 params.wasmsimd.remainder_mask[1] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
234 params.wasmsimd.remainder_mask[2] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
235 params.wasmsimd.remainder_mask[3] = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
236 params.wasmsimd.remainder_threshold[0] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
237 params.wasmsimd.remainder_threshold[1] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
238 params.wasmsimd.remainder_threshold[2] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
239 params.wasmsimd.remainder_threshold[3] = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
240 params.wasmsimd.shift = shift; in xnn_init_qs8_gemm_params()
242 params.wasmsimd.output_zero_point[i] = (int16_t) output_zero_point; in xnn_init_qs8_gemm_params()
245 params.wasmsimd.output_min[i] = output_min; in xnn_init_qs8_gemm_params()
246 params.wasmsimd.output_max[i] = output_max; in xnn_init_qs8_gemm_params()
251 params.scalar.multiplier = multiplier; in xnn_init_qs8_gemm_params()
252 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_qs8_gemm_params()
253 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_qs8_gemm_params()
254 params.scalar.shift = (uint32_t) shift; in xnn_init_qs8_gemm_params()
255 params.scalar.output_min_less_zero_point = (int32_t) output_min - (int32_t) output_zero_point; in xnn_init_qs8_gemm_params()
256 params.scalar.output_max_less_zero_point = (int32_t) output_max - (int32_t) output_zero_point; in xnn_init_qs8_gemm_params()
257 params.scalar.output_zero_point = (int32_t) output_zero_point; in xnn_init_qs8_gemm_params()
259 return params; in xnn_init_qs8_gemm_params()
271 } params; in xnn_init_scalar_qs8_gemm_xw_params() local
272 params.gemm = xnn_init_scalar_qs8_gemm_params(scale, output_zero_point, output_min, output_max); in xnn_init_scalar_qs8_gemm_xw_params()
273 return params.gemm_xw; in xnn_init_scalar_qs8_gemm_xw_params()
285 } params; in xnn_init_qs8_gemm_xw_params() local
286 params.gemm = xnn_init_qs8_gemm_params(scale, output_zero_point, output_min, output_max); in xnn_init_qs8_gemm_xw_params()
287 return params.gemm_xw; in xnn_init_qs8_gemm_xw_params()
312 union xnn_qu8_avgpool_params params; in xnn_init_qu8_avgpool_params() local
316 params.sse2.bias[0] = bias; in xnn_init_qu8_avgpool_params()
317 params.sse2.bias[1] = bias; in xnn_init_qu8_avgpool_params()
318 params.sse2.bias[2] = bias; in xnn_init_qu8_avgpool_params()
319 params.sse2.bias[3] = bias; in xnn_init_qu8_avgpool_params()
320 params.sse2.multiplier[0] = (uint32_t) multiplier; in xnn_init_qu8_avgpool_params()
321 params.sse2.multiplier[1] = (uint32_t) multiplier; in xnn_init_qu8_avgpool_params()
322 params.sse2.multiplier[2] = (uint32_t) multiplier; in xnn_init_qu8_avgpool_params()
323 params.sse2.multiplier[3] = (uint32_t) multiplier; in xnn_init_qu8_avgpool_params()
324 params.sse2.rounding[0] = rounding; in xnn_init_qu8_avgpool_params()
325 params.sse2.rounding[1] = rounding; in xnn_init_qu8_avgpool_params()
326 params.sse2.right_shift[0] = (uint64_t) right_shift; in xnn_init_qu8_avgpool_params()
327 params.sse2.right_shift[1] = (uint64_t) right_shift; in xnn_init_qu8_avgpool_params()
329 params.sse2.output_zero_point[i] = (int16_t) (uint16_t) output_zero_point; in xnn_init_qu8_avgpool_params()
332 params.sse2.output_min[i] = output_min; in xnn_init_qu8_avgpool_params()
333 params.sse2.output_max[i] = output_max; in xnn_init_qu8_avgpool_params()
336 params.neon.bias = bias; in xnn_init_qu8_avgpool_params()
337 params.neon.multiplier = multiplier; in xnn_init_qu8_avgpool_params()
338 params.neon.left_shift = (int64_t) -shift; in xnn_init_qu8_avgpool_params()
339 params.neon.output_zero_point = (int16_t) (uint16_t) output_zero_point; in xnn_init_qu8_avgpool_params()
340 params.neon.output_min = output_min; in xnn_init_qu8_avgpool_params()
341 params.neon.output_max = output_max; in xnn_init_qu8_avgpool_params()
345 params.scalar.bias = bias; in xnn_init_qu8_avgpool_params()
346 params.scalar.multiplier = multiplier; in xnn_init_qu8_avgpool_params()
347 params.scalar.rounding = rounding; in xnn_init_qu8_avgpool_params()
348 params.scalar.right_shift = right_shift; in xnn_init_qu8_avgpool_params()
349 params.scalar.output_min_less_zero_point = in xnn_init_qu8_avgpool_params()
351 params.scalar.output_max_less_zero_point = in xnn_init_qu8_avgpool_params()
353 params.scalar.output_zero_point = (int32_t) (uint32_t) output_zero_point; in xnn_init_qu8_avgpool_params()
355 return params; in xnn_init_qu8_avgpool_params()
380 union xnn_qu8_avgpool_params params; in xnn_init_scalar_qu8_avgpool_params() local
383 params.scalar.bias = bias; in xnn_init_scalar_qu8_avgpool_params()
384 params.scalar.rounding = rounding; in xnn_init_scalar_qu8_avgpool_params()
385 params.scalar.multiplier = multiplier; in xnn_init_scalar_qu8_avgpool_params()
386 params.scalar.right_shift = right_shift; in xnn_init_scalar_qu8_avgpool_params()
387 params.scalar.output_min_less_zero_point = in xnn_init_scalar_qu8_avgpool_params()
389 params.scalar.output_max_less_zero_point = in xnn_init_scalar_qu8_avgpool_params()
391 params.scalar.output_zero_point = (int32_t) (uint32_t) output_zero_point; in xnn_init_scalar_qu8_avgpool_params()
392 return params; in xnn_init_scalar_qu8_avgpool_params()
396 union xnn_qu8_avgpool_params* params, in xnn_update_qu8_avgpool_params() argument
417 params->sse2.bias[0] = bias; in xnn_update_qu8_avgpool_params()
418 params->sse2.bias[1] = bias; in xnn_update_qu8_avgpool_params()
419 params->sse2.bias[2] = bias; in xnn_update_qu8_avgpool_params()
420 params->sse2.bias[3] = bias; in xnn_update_qu8_avgpool_params()
421 params->sse2.multiplier[0] = (uint32_t) multiplier; in xnn_update_qu8_avgpool_params()
422 params->sse2.multiplier[1] = (uint32_t) multiplier; in xnn_update_qu8_avgpool_params()
423 params->sse2.multiplier[2] = (uint32_t) multiplier; in xnn_update_qu8_avgpool_params()
424 params->sse2.multiplier[3] = (uint32_t) multiplier; in xnn_update_qu8_avgpool_params()
425 params->sse2.rounding[0] = rounding; in xnn_update_qu8_avgpool_params()
426 params->sse2.rounding[1] = rounding; in xnn_update_qu8_avgpool_params()
427 params->sse2.right_shift[0] = (uint64_t) (uint32_t) shift; in xnn_update_qu8_avgpool_params()
428 params->sse2.right_shift[1] = (uint64_t) (uint32_t) shift; in xnn_update_qu8_avgpool_params()
430 params->neon.bias = bias; in xnn_update_qu8_avgpool_params()
431 params->neon.multiplier = multiplier; in xnn_update_qu8_avgpool_params()
432 params->neon.left_shift = (int64_t) -shift; in xnn_update_qu8_avgpool_params()
435 params->scalar.bias = bias; in xnn_update_qu8_avgpool_params()
436 params->scalar.multiplier = multiplier; in xnn_update_qu8_avgpool_params()
437 params->scalar.rounding = rounding; in xnn_update_qu8_avgpool_params()
438 params->scalar.right_shift = (uint32_t) shift; in xnn_update_qu8_avgpool_params()
464 union xnn_qs8_avgpool_params params; in xnn_init_qs8_avgpool_params() local
467 params.sse2.bias[0] = bias; in xnn_init_qs8_avgpool_params()
468 params.sse2.bias[1] = bias; in xnn_init_qs8_avgpool_params()
469 params.sse2.bias[2] = bias; in xnn_init_qs8_avgpool_params()
470 params.sse2.bias[3] = bias; in xnn_init_qs8_avgpool_params()
471 params.sse2.multiplier[0] = (uint32_t) multiplier; in xnn_init_qs8_avgpool_params()
472 params.sse2.multiplier[1] = (uint32_t) multiplier; in xnn_init_qs8_avgpool_params()
473 params.sse2.multiplier[2] = (uint32_t) multiplier; in xnn_init_qs8_avgpool_params()
474 params.sse2.multiplier[3] = (uint32_t) multiplier; in xnn_init_qs8_avgpool_params()
475 params.sse2.rounding[0] = rounding; in xnn_init_qs8_avgpool_params()
476 params.sse2.rounding[1] = rounding; in xnn_init_qs8_avgpool_params()
477 params.sse2.shift[0] = (uint64_t) (uint32_t) shift; in xnn_init_qs8_avgpool_params()
478 params.sse2.shift[1] = (uint64_t) (uint32_t) shift; in xnn_init_qs8_avgpool_params()
480 params.sse2.output_zero_point[i] = (int16_t) output_zero_point; in xnn_init_qs8_avgpool_params()
481 params.sse2.output_min[i] = (int16_t) output_min; in xnn_init_qs8_avgpool_params()
482 params.sse2.output_max[i] = (int16_t) output_max; in xnn_init_qs8_avgpool_params()
485 params.neon.bias = bias; in xnn_init_qs8_avgpool_params()
486 params.neon.multiplier = multiplier; in xnn_init_qs8_avgpool_params()
487 params.neon.left_shift = (int64_t) -shift; in xnn_init_qs8_avgpool_params()
488 params.neon.output_zero_point = (int16_t) output_zero_point; in xnn_init_qs8_avgpool_params()
489 params.neon.output_min = output_min; in xnn_init_qs8_avgpool_params()
490 params.neon.output_max = output_max; in xnn_init_qs8_avgpool_params()
493 params.wasmsimd.bias[0] = bias; in xnn_init_qs8_avgpool_params()
494 params.wasmsimd.bias[1] = bias; in xnn_init_qs8_avgpool_params()
495 params.wasmsimd.bias[2] = bias; in xnn_init_qs8_avgpool_params()
496 params.wasmsimd.bias[3] = bias; in xnn_init_qs8_avgpool_params()
497 params.wasmsimd.multiplier[0] = (int64_t) multiplier; in xnn_init_qs8_avgpool_params()
498 params.wasmsimd.multiplier[1] = (int64_t) multiplier; in xnn_init_qs8_avgpool_params()
499 params.wasmsimd.rounding[0] = rounding; in xnn_init_qs8_avgpool_params()
500 params.wasmsimd.rounding[1] = rounding; in xnn_init_qs8_avgpool_params()
501 params.wasmsimd.shift = shift; in xnn_init_qs8_avgpool_params()
503 params.wasmsimd.output_zero_point[i] = (int16_t) output_zero_point; in xnn_init_qs8_avgpool_params()
506 params.wasmsimd.output_min[i] = output_min; in xnn_init_qs8_avgpool_params()
507 params.wasmsimd.output_max[i] = output_max; in xnn_init_qs8_avgpool_params()
511 params.scalar.bias = bias; in xnn_init_qs8_avgpool_params()
512 params.scalar.multiplier = multiplier; in xnn_init_qs8_avgpool_params()
513 params.scalar.rounding = rounding; in xnn_init_qs8_avgpool_params()
514 params.scalar.shift = (uint32_t) shift; in xnn_init_qs8_avgpool_params()
515 params.scalar.output_min_less_zero_point = (int32_t) output_min - (int32_t) output_zero_point; in xnn_init_qs8_avgpool_params()
516 params.scalar.output_max_less_zero_point = (int32_t) output_max - (int32_t) output_zero_point; in xnn_init_qs8_avgpool_params()
517 params.scalar.output_zero_point = (int32_t) output_zero_point; in xnn_init_qs8_avgpool_params()
519 return params; in xnn_init_qs8_avgpool_params()
544 union xnn_qs8_avgpool_params params; in xnn_init_scalar_qs8_avgpool_params() local
546 params.scalar.bias = bias; in xnn_init_scalar_qs8_avgpool_params()
547 params.scalar.rounding = rounding; in xnn_init_scalar_qs8_avgpool_params()
548 params.scalar.multiplier = multiplier; in xnn_init_scalar_qs8_avgpool_params()
549 params.scalar.shift = shift; in xnn_init_scalar_qs8_avgpool_params()
550 params.scalar.output_min_less_zero_point = (int32_t) output_min - (int32_t) output_zero_point; in xnn_init_scalar_qs8_avgpool_params()
551 params.scalar.output_max_less_zero_point = (int32_t) output_max - (int32_t) output_zero_point; in xnn_init_scalar_qs8_avgpool_params()
552 params.scalar.output_zero_point = (int32_t) output_zero_point; in xnn_init_scalar_qs8_avgpool_params()
553 return params; in xnn_init_scalar_qs8_avgpool_params()
557 union xnn_qs8_avgpool_params* params, in xnn_update_qs8_avgpool_params() argument
578 params->sse2.bias[0] = bias; in xnn_update_qs8_avgpool_params()
579 params->sse2.bias[1] = bias; in xnn_update_qs8_avgpool_params()
580 params->sse2.bias[2] = bias; in xnn_update_qs8_avgpool_params()
581 params->sse2.bias[3] = bias; in xnn_update_qs8_avgpool_params()
582 params->sse2.multiplier[0] = (uint32_t) multiplier; in xnn_update_qs8_avgpool_params()
583 params->sse2.multiplier[1] = (uint32_t) multiplier; in xnn_update_qs8_avgpool_params()
584 params->sse2.multiplier[2] = (uint32_t) multiplier; in xnn_update_qs8_avgpool_params()
585 params->sse2.multiplier[3] = (uint32_t) multiplier; in xnn_update_qs8_avgpool_params()
586 params->sse2.rounding[0] = rounding; in xnn_update_qs8_avgpool_params()
587 params->sse2.rounding[1] = rounding; in xnn_update_qs8_avgpool_params()
588 params->sse2.shift[0] = (uint64_t) (uint32_t) shift; in xnn_update_qs8_avgpool_params()
589 params->sse2.shift[1] = (uint64_t) (uint32_t) shift; in xnn_update_qs8_avgpool_params()
591 params->neon.bias = bias; in xnn_update_qs8_avgpool_params()
592 params->neon.multiplier = multiplier; in xnn_update_qs8_avgpool_params()
593 params->neon.left_shift = (int64_t) -shift; in xnn_update_qs8_avgpool_params()
596 params->wasmsimd.bias[0] = bias; in xnn_update_qs8_avgpool_params()
597 params->wasmsimd.bias[1] = bias; in xnn_update_qs8_avgpool_params()
598 params->wasmsimd.bias[2] = bias; in xnn_update_qs8_avgpool_params()
599 params->wasmsimd.bias[3] = bias; in xnn_update_qs8_avgpool_params()
600 params->wasmsimd.multiplier[0] = (int64_t) multiplier; in xnn_update_qs8_avgpool_params()
601 params->wasmsimd.multiplier[1] = (int64_t) multiplier; in xnn_update_qs8_avgpool_params()
602 params->wasmsimd.rounding[0] = rounding; in xnn_update_qs8_avgpool_params()
603 params->wasmsimd.rounding[1] = rounding; in xnn_update_qs8_avgpool_params()
604 params->wasmsimd.shift = shift; in xnn_update_qs8_avgpool_params()
607 params->scalar.bias = bias; in xnn_update_qs8_avgpool_params()
608 params->scalar.multiplier = multiplier; in xnn_update_qs8_avgpool_params()
609 params->scalar.rounding = rounding; in xnn_update_qs8_avgpool_params()
610 params->scalar.shift = (uint32_t) shift; in xnn_update_qs8_avgpool_params()
615 struct xnn_f16_scaleminmax_params* params, in xnn_update_f16_scaleminmax_params() argument
618 params->scale = scale; in xnn_update_f16_scaleminmax_params()
622 union xnn_f32_scaleminmax_params* params, in xnn_update_f32_scaleminmax_params() argument
627 params->sse2.scale[i] = scale; in xnn_update_f32_scaleminmax_params()
630 params->scalar.scale = scale; in xnn_update_f32_scaleminmax_params()
639 struct xnn_f16_scaleminmax_params params; in xnn_init_f16_scaleminmax_params() local
640 params.scale = scale; in xnn_init_f16_scaleminmax_params()
641 params.min = min; in xnn_init_f16_scaleminmax_params()
642 params.max = max; in xnn_init_f16_scaleminmax_params()
643 return params; in xnn_init_f16_scaleminmax_params()
651 union xnn_f32_scaleminmax_params params; in xnn_init_f32_scaleminmax_params() local
654 params.sse2.scale[i] = scale; in xnn_init_f32_scaleminmax_params()
655 params.sse2.min[i] = min; in xnn_init_f32_scaleminmax_params()
656 params.sse2.max[i] = max; in xnn_init_f32_scaleminmax_params()
659 params.scalar.scale = scale; in xnn_init_f32_scaleminmax_params()
660 params.scalar.min = min; in xnn_init_f32_scaleminmax_params()
661 params.scalar.max = max; in xnn_init_f32_scaleminmax_params()
663 return params; in xnn_init_f32_scaleminmax_params()
672 union xnn_f32_gavgpool_params params; in xnn_init_f32_gavgpool_params() local
675 params.sse.multiplier[i] = multiplier; in xnn_init_f32_gavgpool_params()
676 params.sse.output_min[i] = output_min; in xnn_init_f32_gavgpool_params()
677 params.sse.output_max[i] = output_max; in xnn_init_f32_gavgpool_params()
681 params.sse.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_gavgpool_params()
682 params.sse.mask[1] = -(uint32_t) (w >= 1); in xnn_init_f32_gavgpool_params()
683 params.sse.mask[2] = -(uint32_t) (w >= 2); in xnn_init_f32_gavgpool_params()
684 params.sse.mask[3] = -(uint32_t) (w >= 3); in xnn_init_f32_gavgpool_params()
686 params.neon.multiplier = multiplier; in xnn_init_f32_gavgpool_params()
687 params.neon.output_min = output_min; in xnn_init_f32_gavgpool_params()
688 params.neon.output_max = output_max; in xnn_init_f32_gavgpool_params()
691 params.neon.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_gavgpool_params()
692 params.neon.mask[1] = -(uint32_t) (w >= 1); in xnn_init_f32_gavgpool_params()
693 params.neon.mask[2] = -(uint32_t) (w >= 2); in xnn_init_f32_gavgpool_params()
694 params.neon.mask[3] = -(uint32_t) (w >= 3); in xnn_init_f32_gavgpool_params()
696 params.scalar.multiplier = multiplier; in xnn_init_f32_gavgpool_params()
697 params.scalar.output_min = output_min; in xnn_init_f32_gavgpool_params()
698 params.scalar.output_max = output_max; in xnn_init_f32_gavgpool_params()
701 params.scalar.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_gavgpool_params()
702 params.scalar.mask[1] = -(int32_t) (w >= 1); in xnn_init_f32_gavgpool_params()
703 params.scalar.mask[2] = -(int32_t) (w >= 2); in xnn_init_f32_gavgpool_params()
704 params.scalar.mask[3] = -(int32_t) (w >= 3); in xnn_init_f32_gavgpool_params()
706 return params; in xnn_init_f32_gavgpool_params()
710 union xnn_f32_gavgpool_params* params, in xnn_update_f32_gavgpool_params() argument
716 params->sse.multiplier[i] = multiplier; in xnn_update_f32_gavgpool_params()
720 params->sse.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_gavgpool_params()
721 params->sse.mask[1] = -(uint32_t) (w >= 1); in xnn_update_f32_gavgpool_params()
722 params->sse.mask[2] = -(uint32_t) (w >= 2); in xnn_update_f32_gavgpool_params()
723 params->sse.mask[3] = -(uint32_t) (w >= 3); in xnn_update_f32_gavgpool_params()
725 params->neon.multiplier = multiplier; in xnn_update_f32_gavgpool_params()
728 params->neon.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_gavgpool_params()
729 params->neon.mask[1] = -(uint32_t) (w >= 1); in xnn_update_f32_gavgpool_params()
730 params->neon.mask[2] = -(uint32_t) (w >= 2); in xnn_update_f32_gavgpool_params()
731 params->neon.mask[3] = -(uint32_t) (w >= 3); in xnn_update_f32_gavgpool_params()
733 params->scalar.multiplier = multiplier; in xnn_update_f32_gavgpool_params()
736 params->scalar.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_gavgpool_params()
737 params->scalar.mask[1] = -(int32_t) (w >= 1); in xnn_update_f32_gavgpool_params()
738 params->scalar.mask[2] = -(int32_t) (w >= 2); in xnn_update_f32_gavgpool_params()
739 params->scalar.mask[3] = -(int32_t) (w >= 3); in xnn_update_f32_gavgpool_params()
748 union xnn_f32_scaleminmax_params params; in xnn_init_scalar_f32_scaleminmax_params() local
749 params.scalar.scale = scale; in xnn_init_scalar_f32_scaleminmax_params()
750 params.scalar.min = min; in xnn_init_scalar_f32_scaleminmax_params()
751 params.scalar.max = max; in xnn_init_scalar_f32_scaleminmax_params()
752 return params; in xnn_init_scalar_f32_scaleminmax_params()
761 union xnn_f32_gavgpool_params params; in xnn_init_scalar_f32_gavgpool_params() local
762 params.scalar.multiplier = multiplier; in xnn_init_scalar_f32_gavgpool_params()
763 params.scalar.output_min = output_min; in xnn_init_scalar_f32_gavgpool_params()
764 params.scalar.output_max = output_max; in xnn_init_scalar_f32_gavgpool_params()
767 params.scalar.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_scalar_f32_gavgpool_params()
768 params.scalar.mask[1] = -(int32_t) (w >= 1); in xnn_init_scalar_f32_gavgpool_params()
769 params.scalar.mask[2] = -(int32_t) (w >= 2); in xnn_init_scalar_f32_gavgpool_params()
770 params.scalar.mask[3] = -(int32_t) (w >= 3); in xnn_init_scalar_f32_gavgpool_params()
771 return params; in xnn_init_scalar_f32_gavgpool_params()
778 struct xnn_f16_minmax_params params; in xnn_init_f16_minmax_params() local
779 params.min = min; in xnn_init_f16_minmax_params()
780 params.max = max; in xnn_init_f16_minmax_params()
781 return params; in xnn_init_f16_minmax_params()
788 union xnn_f32_minmax_params params; in xnn_init_f32_minmax_params() local
791 params.sse.min[i] = output_min; in xnn_init_f32_minmax_params()
792 params.sse.max[i] = output_max; in xnn_init_f32_minmax_params()
795 params.scalar.min = output_min; in xnn_init_f32_minmax_params()
796 params.scalar.max = output_max; in xnn_init_f32_minmax_params()
798 return params; in xnn_init_f32_minmax_params()
805 union xnn_f32_minmax_params params; in xnn_init_scalar_f32_minmax_params() local
806 params.scalar.min = output_min; in xnn_init_scalar_f32_minmax_params()
807 params.scalar.max = output_max; in xnn_init_scalar_f32_minmax_params()
808 return params; in xnn_init_scalar_f32_minmax_params()
813 struct xnn_f16_hswish_params params; in xnn_init_f16_hswish_params() local
814 params.sixth = UINT16_C(0x3155); in xnn_init_f16_hswish_params()
815 params.three = UINT16_C(0x4200); in xnn_init_f16_hswish_params()
816 params.six = UINT16_C(0x4600); in xnn_init_f16_hswish_params()
817 return params; in xnn_init_f16_hswish_params()
822 union xnn_f32_hswish_params params; in xnn_init_f32_hswish_params() local
825 params.sse.sixth[i] = 0x1.555556p-3f; in xnn_init_f32_hswish_params()
826 params.sse.half[i] = 0.5f; in xnn_init_f32_hswish_params()
827 params.sse.one[i] = 1.0f; in xnn_init_f32_hswish_params()
830 params.scalar.sixth = 0x1.555556p-3f; in xnn_init_f32_hswish_params()
831 params.scalar.three = 3.0f; in xnn_init_f32_hswish_params()
832 params.scalar.six = 6.0f; in xnn_init_f32_hswish_params()
834 return params; in xnn_init_f32_hswish_params()
839 union xnn_f32_hswish_params params; in xnn_init_scalar_f32_hswish_params() local
840 params.scalar.sixth = 0x1.555556p-3f; in xnn_init_scalar_f32_hswish_params()
841 params.scalar.three = 3.0f; in xnn_init_scalar_f32_hswish_params()
842 params.scalar.six = 6.0f; in xnn_init_scalar_f32_hswish_params()
843 return params; in xnn_init_scalar_f32_hswish_params()
848 union xnn_f32_abs_params params = { 0 }; in xnn_init_f32_abs_params() local
851 params.sse.nonsign_mask[i] = math_nonsign_mask_f32(); in xnn_init_f32_abs_params()
854 params.wasmsimd.nonsign_mask = math_nonsign_mask_f32(); in xnn_init_f32_abs_params()
856 return params; in xnn_init_f32_abs_params()
861 union xnn_f32_abs_params params = { 0 }; in xnn_init_scalar_f32_abs_params() local
862 return params; in xnn_init_scalar_f32_abs_params()
867 union xnn_f32_neg_params params = { 0 }; in xnn_init_f32_neg_params() local
870 params.sse.sign_mask[i] = -0.0f; in xnn_init_f32_neg_params()
873 params.wasmsimd.sign_mask = -0.0f; in xnn_init_f32_neg_params()
875 return params; in xnn_init_f32_neg_params()
880 union xnn_f32_neg_params params = { 0 }; in xnn_init_scalar_f32_neg_params() local
881 return params; in xnn_init_scalar_f32_neg_params()
886 union xnn_f32_rnd_params params = { 0 }; in xnn_init_f32_rnd_params() local
889 params.sse2.sign_mask[i] = -0.0f; in xnn_init_f32_rnd_params()
892 params.sse2.one[i] = 1.0f; in xnn_init_f32_rnd_params()
895 return params; in xnn_init_f32_rnd_params()
900 union xnn_f32_rnd_params params = { 0 }; in xnn_init_scalar_f32_rnd_params() local
901 return params; in xnn_init_scalar_f32_rnd_params()
906 union xnn_f32_elu_params params; in xnn_init_f32_elu_params() local
909 params.sse.prescale[i] = prescale; in xnn_init_f32_elu_params()
910 params.sse.alpha[i] = alpha; in xnn_init_f32_elu_params()
911 params.sse.beta[i] = beta; in xnn_init_f32_elu_params()
914 params.scalar.prescale = prescale; in xnn_init_f32_elu_params()
915 params.scalar.alpha = alpha; in xnn_init_f32_elu_params()
916 params.scalar.beta = beta; in xnn_init_f32_elu_params()
918 return params; in xnn_init_f32_elu_params()
923 union xnn_f32_elu_params params; in xnn_init_scalar_f32_elu_params() local
924 params.scalar.prescale = prescale; in xnn_init_scalar_f32_elu_params()
925 params.scalar.alpha = alpha; in xnn_init_scalar_f32_elu_params()
926 params.scalar.beta = beta; in xnn_init_scalar_f32_elu_params()
927 return params; in xnn_init_scalar_f32_elu_params()
932 union xnn_f32_lrelu_params params; in xnn_init_f32_lrelu_params() local
935 params.sse.slope[i] = slope; in xnn_init_f32_lrelu_params()
938 params.scalar.slope = slope; in xnn_init_f32_lrelu_params()
940 return params; in xnn_init_f32_lrelu_params()
945 union xnn_f32_lrelu_params params; in xnn_init_scalar_f32_lrelu_params() local
946 params.scalar.slope = slope; in xnn_init_scalar_f32_lrelu_params()
947 return params; in xnn_init_scalar_f32_lrelu_params()
952 union xnn_f32_sqrt_params params = { 0 }; in xnn_init_f32_sqrt_params() local
954 params.fma.half = 0.5f; in xnn_init_f32_sqrt_params()
956 return params; in xnn_init_f32_sqrt_params()
961 union xnn_f32_sqrt_params params = { 0 }; in xnn_init_scalar_f32_sqrt_params() local
962 return params; in xnn_init_scalar_f32_sqrt_params()
970 union xnn_f32_chw_params params; in xnn_init_f32_chw_params() local
973 params.sse.min[i] = output_min; in xnn_init_f32_chw_params()
974 params.sse.max[i] = output_max; in xnn_init_f32_chw_params()
978 params.sse.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_chw_params()
979 params.sse.mask[1] = -(uint32_t) (w4 >= 1); in xnn_init_f32_chw_params()
980 params.sse.mask[2] = -(uint32_t) (w4 >= 2); in xnn_init_f32_chw_params()
981 params.sse.mask[3] = -(uint32_t) (w4 >= 3); in xnn_init_f32_chw_params()
984 params.sse.mask_even[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_chw_params()
985 params.sse.mask_even[1] = -(uint32_t) (w8 >= 2); in xnn_init_f32_chw_params()
986 params.sse.mask_even[2] = -(uint32_t) (w8 >= 4); in xnn_init_f32_chw_params()
987 params.sse.mask_even[3] = -(uint32_t) (w8 >= 6); in xnn_init_f32_chw_params()
988 params.sse.mask_odd[0] = -(uint32_t) (w8 >= 1); in xnn_init_f32_chw_params()
989 params.sse.mask_odd[1] = -(uint32_t) (w8 >= 3); in xnn_init_f32_chw_params()
990 params.sse.mask_odd[2] = -(uint32_t) (w8 >= 5); in xnn_init_f32_chw_params()
991 params.sse.mask_odd[3] = -(uint32_t) (w8 >= 7); in xnn_init_f32_chw_params()
993 params.neon.min = output_min; in xnn_init_f32_chw_params()
994 params.neon.max = output_max; in xnn_init_f32_chw_params()
997 params.neon.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_chw_params()
998 params.neon.mask[1] = -(uint32_t) (w4 >= 1); in xnn_init_f32_chw_params()
999 params.neon.mask[2] = -(uint32_t) (w4 >= 2); in xnn_init_f32_chw_params()
1000 params.neon.mask[3] = -(uint32_t) (w4 >= 3); in xnn_init_f32_chw_params()
1003 params.neon.mask_even[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_chw_params()
1004 params.neon.mask_even[1] = -(uint32_t) (w8 >= 2); in xnn_init_f32_chw_params()
1005 params.neon.mask_even[2] = -(uint32_t) (w8 >= 4); in xnn_init_f32_chw_params()
1006 params.neon.mask_even[3] = -(uint32_t) (w8 >= 6); in xnn_init_f32_chw_params()
1007 params.neon.mask_odd[0] = -(uint32_t) (w8 >= 1); in xnn_init_f32_chw_params()
1008 params.neon.mask_odd[1] = -(uint32_t) (w8 >= 3); in xnn_init_f32_chw_params()
1009 params.neon.mask_odd[2] = -(uint32_t) (w8 >= 5); in xnn_init_f32_chw_params()
1010 params.neon.mask_odd[3] = -(uint32_t) (w8 >= 7); in xnn_init_f32_chw_params()
1012 params.scalar.min = output_min; in xnn_init_f32_chw_params()
1013 params.scalar.max = output_max; in xnn_init_f32_chw_params()
1016 params.scalar.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_chw_params()
1017 params.scalar.mask[1] = -(uint32_t) (w4 >= 1); in xnn_init_f32_chw_params()
1018 params.scalar.mask[2] = -(uint32_t) (w4 >= 2); in xnn_init_f32_chw_params()
1019 params.scalar.mask[3] = -(uint32_t) (w4 >= 3); in xnn_init_f32_chw_params()
1022 params.scalar.mask_even[0] = UINT32_C(0xFFFFFFFF); in xnn_init_f32_chw_params()
1023 params.scalar.mask_even[1] = -(uint32_t) (w8 >= 2); in xnn_init_f32_chw_params()
1024 params.scalar.mask_even[2] = -(uint32_t) (w8 >= 4); in xnn_init_f32_chw_params()
1025 params.scalar.mask_even[3] = -(uint32_t) (w8 >= 6); in xnn_init_f32_chw_params()
1026 params.scalar.mask_odd[0] = -(uint32_t) (w8 >= 1); in xnn_init_f32_chw_params()
1027 params.scalar.mask_odd[1] = -(uint32_t) (w8 >= 3); in xnn_init_f32_chw_params()
1028 params.scalar.mask_odd[2] = -(uint32_t) (w8 >= 5); in xnn_init_f32_chw_params()
1029 params.scalar.mask_odd[3] = -(uint32_t) (w8 >= 7); in xnn_init_f32_chw_params()
1031 return params; in xnn_init_f32_chw_params()
1035 union xnn_f32_chw_params* params, in xnn_update_f32_chw_params() argument
1040 params->sse.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_chw_params()
1041 params->sse.mask[1] = -(uint32_t) (w4 >= 1); in xnn_update_f32_chw_params()
1042 params->sse.mask[2] = -(uint32_t) (w4 >= 2); in xnn_update_f32_chw_params()
1043 params->sse.mask[3] = -(uint32_t) (w4 >= 3); in xnn_update_f32_chw_params()
1046 params->sse.mask_even[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_chw_params()
1047 params->sse.mask_even[1] = -(uint32_t) (w8 >= 2); in xnn_update_f32_chw_params()
1048 params->sse.mask_even[2] = -(uint32_t) (w8 >= 4); in xnn_update_f32_chw_params()
1049 params->sse.mask_even[3] = -(uint32_t) (w8 >= 6); in xnn_update_f32_chw_params()
1050 params->sse.mask_odd[0] = -(uint32_t) (w8 >= 1); in xnn_update_f32_chw_params()
1051 params->sse.mask_odd[1] = -(uint32_t) (w8 >= 3); in xnn_update_f32_chw_params()
1052 params->sse.mask_odd[2] = -(uint32_t) (w8 >= 5); in xnn_update_f32_chw_params()
1053 params->sse.mask_odd[3] = -(uint32_t) (w8 >= 7); in xnn_update_f32_chw_params()
1056 params->neon.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_chw_params()
1057 params->neon.mask[1] = -(uint32_t) (w4 >= 1); in xnn_update_f32_chw_params()
1058 params->neon.mask[2] = -(uint32_t) (w4 >= 2); in xnn_update_f32_chw_params()
1059 params->neon.mask[3] = -(uint32_t) (w4 >= 3); in xnn_update_f32_chw_params()
1062 params->neon.mask_even[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_chw_params()
1063 params->neon.mask_even[1] = -(uint32_t) (w8 >= 2); in xnn_update_f32_chw_params()
1064 params->neon.mask_even[2] = -(uint32_t) (w8 >= 4); in xnn_update_f32_chw_params()
1065 params->neon.mask_even[3] = -(uint32_t) (w8 >= 6); in xnn_update_f32_chw_params()
1066 params->neon.mask_odd[0] = -(uint32_t) (w8 >= 1); in xnn_update_f32_chw_params()
1067 params->neon.mask_odd[1] = -(uint32_t) (w8 >= 3); in xnn_update_f32_chw_params()
1068 params->neon.mask_odd[2] = -(uint32_t) (w8 >= 5); in xnn_update_f32_chw_params()
1069 params->neon.mask_odd[3] = -(uint32_t) (w8 >= 7); in xnn_update_f32_chw_params()
1072 params->scalar.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_chw_params()
1073 params->scalar.mask[1] = -(uint32_t) (w4 >= 1); in xnn_update_f32_chw_params()
1074 params->scalar.mask[2] = -(uint32_t) (w4 >= 2); in xnn_update_f32_chw_params()
1075 params->scalar.mask[3] = -(uint32_t) (w4 >= 3); in xnn_update_f32_chw_params()
1078 params->scalar.mask_even[0] = UINT32_C(0xFFFFFFFF); in xnn_update_f32_chw_params()
1079 params->scalar.mask_even[1] = -(uint32_t) (w8 >= 2); in xnn_update_f32_chw_params()
1080 params->scalar.mask_even[2] = -(uint32_t) (w8 >= 4); in xnn_update_f32_chw_params()
1081 params->scalar.mask_even[3] = -(uint32_t) (w8 >= 6); in xnn_update_f32_chw_params()
1082 params->scalar.mask_odd[0] = -(uint32_t) (w8 >= 1); in xnn_update_f32_chw_params()
1083 params->scalar.mask_odd[1] = -(uint32_t) (w8 >= 3); in xnn_update_f32_chw_params()
1084 params->scalar.mask_odd[2] = -(uint32_t) (w8 >= 5); in xnn_update_f32_chw_params()
1085 params->scalar.mask_odd[3] = -(uint32_t) (w8 >= 7); in xnn_update_f32_chw_params()
1094 union xnn_f32_chw_params params; in xnn_init_scalar_f32_chw_params() local
1095 params.scalar.min = output_min; in xnn_init_scalar_f32_chw_params()
1096 params.scalar.max = output_max; in xnn_init_scalar_f32_chw_params()
1099 params.scalar.mask[0] = UINT32_C(0xFFFFFFFF); in xnn_init_scalar_f32_chw_params()
1100 params.scalar.mask[1] = -(uint32_t) (w4 >= 1); in xnn_init_scalar_f32_chw_params()
1101 params.scalar.mask[2] = -(uint32_t) (w4 >= 2); in xnn_init_scalar_f32_chw_params()
1102 params.scalar.mask[3] = -(uint32_t) (w4 >= 3); in xnn_init_scalar_f32_chw_params()
1105 params.scalar.mask_even[0] = UINT32_C(0xFFFFFFFF); in xnn_init_scalar_f32_chw_params()
1106 params.scalar.mask_even[1] = -(uint32_t) (w8 >= 2); in xnn_init_scalar_f32_chw_params()
1107 params.scalar.mask_even[2] = -(uint32_t) (w8 >= 4); in xnn_init_scalar_f32_chw_params()
1108 params.scalar.mask_even[3] = -(uint32_t) (w8 >= 6); in xnn_init_scalar_f32_chw_params()
1109 params.scalar.mask_odd[0] = -(uint32_t) (w8 >= 1); in xnn_init_scalar_f32_chw_params()
1110 params.scalar.mask_odd[1] = -(uint32_t) (w8 >= 3); in xnn_init_scalar_f32_chw_params()
1111 params.scalar.mask_odd[2] = -(uint32_t) (w8 >= 5); in xnn_init_scalar_f32_chw_params()
1112 params.scalar.mask_odd[3] = -(uint32_t) (w8 >= 7); in xnn_init_scalar_f32_chw_params()
1114 return params; in xnn_init_scalar_f32_chw_params()
1123 union xnn_u8_minmax_params params; in xnn_init_u8_minmax_params() local
1126 params.sse2.min[i] = output_min; in xnn_init_u8_minmax_params()
1127 params.sse2.max[i] = output_max; in xnn_init_u8_minmax_params()
1130 params.neon.min = output_min; in xnn_init_u8_minmax_params()
1131 params.neon.max = output_max; in xnn_init_u8_minmax_params()
1133 params.scalar.min = (int32_t) (uint32_t) output_min; in xnn_init_u8_minmax_params()
1134 params.scalar.max = (int32_t) (uint32_t) output_max; in xnn_init_u8_minmax_params()
1136 return params; in xnn_init_u8_minmax_params()
1145 union xnn_u8_minmax_params params; in xnn_init_scalar_u8_minmax_params() local
1146 params.scalar.min = (int32_t) (uint32_t) output_min; in xnn_init_scalar_u8_minmax_params()
1147 params.scalar.max = (int32_t) (uint32_t) output_max; in xnn_init_scalar_u8_minmax_params()
1148 return params; in xnn_init_scalar_u8_minmax_params()
1185 union xnn_qu8_add_params params; in xnn_init_qu8_add_params() local
1192 params.sse2.zero_point_product[i] = zero_point_product; in xnn_init_qu8_add_params()
1195 params.sse2.y_zero_point[i] = (int16_t) (uint16_t) output_zero_point; in xnn_init_qu8_add_params()
1198 params.sse2.a_multiplier_lo[i] = (uint16_t) (uint32_t) a_multiplier; in xnn_init_qu8_add_params()
1199 params.sse2.a_multiplier_hi[i] = (uint16_t) ((uint32_t) a_multiplier >> 16); in xnn_init_qu8_add_params()
1200 params.sse2.b_multiplier_lo[i] = (uint16_t) (uint32_t) b_multiplier; in xnn_init_qu8_add_params()
1201 params.sse2.b_multiplier_hi[i] = (uint16_t) ((uint32_t) b_multiplier >> 16); in xnn_init_qu8_add_params()
1203 params.sse2.a_multiplier = a_multiplier; in xnn_init_qu8_add_params()
1204 params.sse2.b_multiplier = b_multiplier; in xnn_init_qu8_add_params()
1206 params.sse2.remainder_mask[i] = remainder_mask; in xnn_init_qu8_add_params()
1207 params.sse2.remainder_threshold[i] = remainder_threshold; in xnn_init_qu8_add_params()
1209 params.sse2.shift = shift; in xnn_init_qu8_add_params()
1211 params.sse2.y_min[i] = output_min; in xnn_init_qu8_add_params()
1212 params.sse2.y_max[i] = output_max; in xnn_init_qu8_add_params()
1215 params.neon.a_zero_point = a_zero_point; in xnn_init_qu8_add_params()
1216 params.neon.b_zero_point = b_zero_point; in xnn_init_qu8_add_params()
1217 params.neon.y_zero_point = (int16_t) (uint16_t) output_zero_point; in xnn_init_qu8_add_params()
1218 params.neon.a_multiplier = (int32_t) a_multiplier; in xnn_init_qu8_add_params()
1219 params.neon.b_multiplier = (int32_t) b_multiplier; in xnn_init_qu8_add_params()
1220 params.neon.right_shift = (int32_t) -shift; in xnn_init_qu8_add_params()
1221 params.neon.y_min = output_min; in xnn_init_qu8_add_params()
1222 params.neon.y_max = output_max; in xnn_init_qu8_add_params()
1226 params.scalar.zero_point_product = in xnn_init_qu8_add_params()
1228 params.scalar.a_multiplier = a_multiplier; in xnn_init_qu8_add_params()
1229 params.scalar.b_multiplier = b_multiplier; in xnn_init_qu8_add_params()
1230 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_qu8_add_params()
1231 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_qu8_add_params()
1232 params.scalar.shift = shift; in xnn_init_qu8_add_params()
1233 params.scalar.y_zero_point = (int32_t) (uint32_t) output_zero_point; in xnn_init_qu8_add_params()
1234 params.scalar.y_min = (int32_t) (uint32_t) output_min; in xnn_init_qu8_add_params()
1235 params.scalar.y_max = (int32_t) (uint32_t) output_max; in xnn_init_qu8_add_params()
1237 return params; in xnn_init_qu8_add_params()
1272 union xnn_qu8_add_params params; in xnn_init_scalar_qu8_add_params() local
1275 params.scalar.zero_point_product = in xnn_init_scalar_qu8_add_params()
1277 params.scalar.a_multiplier = a_multiplier; in xnn_init_scalar_qu8_add_params()
1278 params.scalar.b_multiplier = b_multiplier; in xnn_init_scalar_qu8_add_params()
1279 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_scalar_qu8_add_params()
1280 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_scalar_qu8_add_params()
1281 params.scalar.shift = shift; in xnn_init_scalar_qu8_add_params()
1282 params.scalar.y_zero_point = (int32_t) (uint32_t) output_zero_point; in xnn_init_scalar_qu8_add_params()
1283 params.scalar.y_min = (int32_t) (uint32_t) output_min; in xnn_init_scalar_qu8_add_params()
1284 params.scalar.y_max = (int32_t) (uint32_t) output_max; in xnn_init_scalar_qu8_add_params()
1285 return params; in xnn_init_scalar_qu8_add_params()
1322 union xnn_qs8_add_params params; in xnn_init_qs8_add_params() local
1329 params.sse2.zero_point_product[i] = zero_point_product; in xnn_init_qs8_add_params()
1336 params.sse2.x_multiplier_lo[i] = x_multiplier_lo; in xnn_init_qs8_add_params()
1337 params.sse2.x_multiplier_hi[i] = x_multiplier_hi; in xnn_init_qs8_add_params()
1338 params.sse2.y_multiplier_lo[i] = y_multiplier_lo; in xnn_init_qs8_add_params()
1339 params.sse2.y_multiplier_hi[i] = y_multiplier_hi; in xnn_init_qs8_add_params()
1341 params.sse2.shift = shift; in xnn_init_qs8_add_params()
1343 params.sse2.x_multiplier[i] = x_multiplier; in xnn_init_qs8_add_params()
1344 params.sse2.y_multiplier[i] = y_multiplier; in xnn_init_qs8_add_params()
1345 params.sse2.remainder_mask[i] = remainder_mask; in xnn_init_qs8_add_params()
1346 params.sse2.remainder_threshold[i] = remainder_threshold; in xnn_init_qs8_add_params()
1349 params.sse2.output_zero_point[i] = (int16_t) output_zero_point; in xnn_init_qs8_add_params()
1350 params.sse2.output_min[i] = (int16_t) output_min; in xnn_init_qs8_add_params()
1351 params.sse2.output_max[i] = (int16_t) output_max; in xnn_init_qs8_add_params()
1354 params.neon.x_zero_point = x_zero_point; in xnn_init_qs8_add_params()
1355 params.neon.y_zero_point = y_zero_point; in xnn_init_qs8_add_params()
1356 params.neon.x_multiplier = (int32_t) x_multiplier; in xnn_init_qs8_add_params()
1357 params.neon.y_multiplier = (int32_t) y_multiplier; in xnn_init_qs8_add_params()
1358 params.neon.right_shift = (int32_t) -shift; in xnn_init_qs8_add_params()
1359 params.neon.output_zero_point = (int16_t) output_zero_point; in xnn_init_qs8_add_params()
1360 params.neon.output_min = output_min; in xnn_init_qs8_add_params()
1361 params.neon.output_max = output_max; in xnn_init_qs8_add_params()
1368 params.wasmsimd.zero_point_product[i] = zero_point_product; in xnn_init_qs8_add_params()
1369 params.wasmsimd.x_multiplier[i] = x_multiplier; in xnn_init_qs8_add_params()
1370 params.wasmsimd.y_multiplier[i] = y_multiplier; in xnn_init_qs8_add_params()
1371 params.wasmsimd.remainder_mask[i] = remainder_mask; in xnn_init_qs8_add_params()
1372 params.wasmsimd.remainder_threshold[i] = remainder_threshold; in xnn_init_qs8_add_params()
1374 params.wasmsimd.shift = shift; in xnn_init_qs8_add_params()
1376 params.wasmsimd.output_zero_point[i] = (int16_t) output_zero_point; in xnn_init_qs8_add_params()
1379 params.wasmsimd.output_min[i] = output_min; in xnn_init_qs8_add_params()
1380 params.wasmsimd.output_max[i] = output_max; in xnn_init_qs8_add_params()
1385 params.scalar.zero_point_product = in xnn_init_qs8_add_params()
1387 params.scalar.x_multiplier = x_multiplier; in xnn_init_qs8_add_params()
1388 params.scalar.y_multiplier = y_multiplier; in xnn_init_qs8_add_params()
1389 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_qs8_add_params()
1390 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_qs8_add_params()
1391 params.scalar.shift = (int32_t) shift; in xnn_init_qs8_add_params()
1392 params.scalar.output_zero_point = (int32_t) output_zero_point; in xnn_init_qs8_add_params()
1393 params.scalar.output_min = (int32_t) output_min; in xnn_init_qs8_add_params()
1394 params.scalar.output_max = (int32_t) output_max; in xnn_init_qs8_add_params()
1396 return params; in xnn_init_qs8_add_params()
1431 union xnn_qs8_add_params params; in xnn_init_scalar_qs8_add_params() local
1434 params.scalar.zero_point_product = in xnn_init_scalar_qs8_add_params()
1436 params.scalar.x_multiplier = x_multiplier; in xnn_init_scalar_qs8_add_params()
1437 params.scalar.y_multiplier = y_multiplier; in xnn_init_scalar_qs8_add_params()
1438 params.scalar.remainder_mask = (int32_t) remainder_mask; in xnn_init_scalar_qs8_add_params()
1439 params.scalar.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_scalar_qs8_add_params()
1440 params.scalar.shift = shift; in xnn_init_scalar_qs8_add_params()
1441 params.scalar.output_zero_point = (int32_t) output_zero_point; in xnn_init_scalar_qs8_add_params()
1442 params.scalar.output_min = (int32_t) output_min; in xnn_init_scalar_qs8_add_params()
1443 params.scalar.output_max = (int32_t) output_max; in xnn_init_scalar_qs8_add_params()
1444 return params; in xnn_init_scalar_qs8_add_params()
1468 union xnn_qu8_requantization_params params; in xnn_init_scalar_qu8_requantization_params() local
1471 params.q31.multiplier = multiplier; in xnn_init_scalar_qu8_requantization_params()
1472 params.q31.remainder_mask = (int32_t) remainder_mask; in xnn_init_scalar_qu8_requantization_params()
1473 params.q31.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_scalar_qu8_requantization_params()
1474 params.q31.shift = (uint32_t) shift; in xnn_init_scalar_qu8_requantization_params()
1475 params.q31.min_less_zero_point = (int32_t) (uint32_t) min - (int32_t) (uint32_t) zero_point; in xnn_init_scalar_qu8_requantization_params()
1476 params.q31.max_less_zero_point = (int32_t) (uint32_t) max - (int32_t) (uint32_t) zero_point; in xnn_init_scalar_qu8_requantization_params()
1477 params.q31.zero_point = (int32_t) (uint32_t) zero_point; in xnn_init_scalar_qu8_requantization_params()
1478 return params; in xnn_init_scalar_qu8_requantization_params()
1502 union xnn_qs8_requantization_params params; in xnn_init_scalar_qs8_requantization_params() local
1505 params.q31.multiplier = multiplier; in xnn_init_scalar_qs8_requantization_params()
1506 params.q31.remainder_mask = (int32_t) remainder_mask; in xnn_init_scalar_qs8_requantization_params()
1507 params.q31.remainder_threshold = (int32_t) remainder_threshold; in xnn_init_scalar_qs8_requantization_params()
1508 params.q31.shift = (uint32_t) shift; in xnn_init_scalar_qs8_requantization_params()
1509 params.q31.min_less_zero_point = (int32_t) min - (int32_t) zero_point; in xnn_init_scalar_qs8_requantization_params()
1510 params.q31.max_less_zero_point = (int32_t) max - (int32_t) zero_point; in xnn_init_scalar_qs8_requantization_params()
1511 params.q31.zero_point = (int32_t) zero_point; in xnn_init_scalar_qs8_requantization_params()
1512 return params; in xnn_init_scalar_qs8_requantization_params()