Lines Matching refs:vi4x5678

233       const __m128 vi4x5678 = _mm_shuffle_ps(vi4x8567, vi4x8567, _MM_SHUFFLE(0, 3, 2, 1));  in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()  local
245 vo2p1 = _mm_add_ps(vo2p1, _mm_mul_ps(vi4x5678, vk23)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
247 vo1p0 = _mm_add_ps(vo1p0, _mm_mul_ps(vi4x5678, vk33)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
249 vo0p1 = _mm_add_ps(vo0p1, _mm_mul_ps(vi4x5678, vk43)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
257 const __m128 vi4x6789 = _mm_shuffle_ps(vi4x5678, vi4x89AB, _MM_SHUFFLE(1, 0, 2, 1)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
411 const __m128 vi4x5678 = _mm_shuffle_ps(vi4x8567, vi4x8567, _MM_SHUFFLE(0, 3, 2, 1)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2() local
423 vo2p1 = _mm_add_ps(vo2p1, _mm_mul_ps(vi4x5678, vk23)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
425 vo1p0 = _mm_add_ps(vo1p0, _mm_mul_ps(vi4x5678, vk33)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
427 vo0p1 = _mm_add_ps(vo0p1, _mm_mul_ps(vi4x5678, vk43)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
435 const __m128 vi4x6789 = _mm_shuffle_ps(vi4x5678, vi4x89AB, _MM_SHUFFLE(1, 0, 2, 1)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
572 const __m128 vi4x5678 = _mm_shuffle_ps(vi4x8567, vi4x8567, _MM_SHUFFLE(0, 3, 2, 1)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2() local
584 vo2p1 = _mm_add_ps(vo2p1, _mm_mul_ps(vi4x5678, vk23)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
586 vo1p0 = _mm_add_ps(vo1p0, _mm_mul_ps(vi4x5678, vk33)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
588 vo0p1 = _mm_add_ps(vo0p1, _mm_mul_ps(vi4x5678, vk43)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()
596 const __m128 vi4x6789 = _mm_shuffle_ps(vi4x5678, vzero, _MM_SHUFFLE(1, 0, 2, 1)); in xnn_f32_dwconv2d_chw_ukernel_5x5p2__sse_3x4_acc2()