Searched refs:vkernel_zero_point (Results 1 – 3 of 3) sorted by relevance
/external/XNNPACK/src/qu8-dwconv/ |
D | up1x9-minmax-scalar.c | 22 const int32_t vkernel_zero_point = params->scalar.kernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() local 78 const int32_t vxk0 = (int32_t) vk0 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 83 const int32_t vxk1 = (int32_t) vk1 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 88 const int32_t vxk2 = (int32_t) vk2 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 93 const int32_t vxk3 = (int32_t) vk3 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 98 const int32_t vxk4 = (int32_t) vk4 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 103 const int32_t vxk5 = (int32_t) vk5 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 108 const int32_t vxk6 = (int32_t) vk6 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 113 const int32_t vxk7 = (int32_t) vk7 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar() 118 const int32_t vxk8 = (int32_t) vk8 - vkernel_zero_point; in xnn_qu8_dwconv_minmax_ukernel_up1x9__scalar()
|
D | up8x9-minmax-neon.c | 27 …const uint8x8_t vkernel_zero_point = vld1_dup_u8((const uint8_t*) &params->neon.kernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() local 82 const int16x8_t vxk0 = vreinterpretq_s16_u16(vsubl_u8(vk0, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 89 const int16x8_t vxk1 = vreinterpretq_s16_u16(vsubl_u8(vk1, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 96 const int16x8_t vxk2 = vreinterpretq_s16_u16(vsubl_u8(vk2, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 103 const int16x8_t vxk3 = vreinterpretq_s16_u16(vsubl_u8(vk3, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 110 const int16x8_t vxk4 = vreinterpretq_s16_u16(vsubl_u8(vk4, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 117 const int16x8_t vxk5 = vreinterpretq_s16_u16(vsubl_u8(vk5, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 124 const int16x8_t vxk6 = vreinterpretq_s16_u16(vsubl_u8(vk6, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 131 const int16x8_t vxk7 = vreinterpretq_s16_u16(vsubl_u8(vk7, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() 138 const int16x8_t vxk8 = vreinterpretq_s16_u16(vsubl_u8(vk8, vkernel_zero_point)); in xnn_qu8_dwconv_minmax_ukernel_up8x9__neon() [all …]
|
D | up8x9-minmax-sse2.c | 26 …const __m128i vkernel_zero_point = _mm_load_si128((const __m128i*) params->sse2.kernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() local 78 const __m128i vxk0 = _mm_sub_epi16(_mm_unpacklo_epi8(vk0, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 87 const __m128i vxk1 = _mm_sub_epi16(_mm_unpacklo_epi8(vk1, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 96 const __m128i vxk2 = _mm_sub_epi16(_mm_unpacklo_epi8(vk2, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 105 const __m128i vxk3 = _mm_sub_epi16(_mm_unpacklo_epi8(vk3, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 114 const __m128i vxk4 = _mm_sub_epi16(_mm_unpacklo_epi8(vk4, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 123 const __m128i vxk5 = _mm_sub_epi16(_mm_unpacklo_epi8(vk5, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 132 const __m128i vxk6 = _mm_sub_epi16(_mm_unpacklo_epi8(vk6, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 141 const __m128i vxk7 = _mm_sub_epi16(_mm_unpacklo_epi8(vk7, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() 150 const __m128i vxk8 = _mm_sub_epi16(_mm_unpacklo_epi8(vk8, vzero), vkernel_zero_point); in xnn_qu8_dwconv_minmax_ukernel_up8x9__sse2() [all …]
|