/external/XNNPACK/src/f32-conv-hwc/gen/ |
D | 3x3s2p0p1c3x4-neonfma-2x2.c | 145 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() local 424 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() local 615 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() local
|
D | 3x3s2p1c3x4-neon-2x2.c | 150 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() local 424 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() local 617 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() local
|
D | 3x3s2p0p1c3x4-neon-2x2.c | 143 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() local 424 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() local 617 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() local
|
D | 3x3s2p1c3x4-neonfma-2x2.c | 152 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() local 424 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() local 615 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() local
|
D | 3x3s2p1c3x4-neonfma-2x1.c | 121 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1() local 313 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1() local
|
D | 3x3s2p0p1c3x4-neonfma-2x1.c | 121 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1() local 313 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1() local
|
D | 3x3s2p0p1c3x4-neon-2x1.c | 119 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1() local 313 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1() local
|
D | 3x3s2p1c3x4-neon-2x1.c | 119 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1() local 313 const float32x4_t vk20c1x0123 = vld1q_f32(w + 24); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1() local
|
D | 3x3s2p0p1c3x8-neon-2x2.c | 172 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x2() local 603 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x2() local 891 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x2() local
|
D | 3x3s2p1c3x8-neonfma-2x2.c | 181 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() local 603 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() local 889 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x2() local
|
D | 3x3s2p0p1c3x8-neonfma-2x2.c | 174 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x2() local 603 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x2() local 889 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x2() local
|
D | 3x3s2p1c3x8-neon-2x2.c | 179 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x2() local 603 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x2() local 891 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x2() local
|
D | 3x3s2p1c3x8-neon-2x1.c | 136 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1() local 425 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1() local
|
D | 3x3s2p0p1c3x8-neonfma-2x1.c | 138 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1() local 425 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1() local
|
D | 3x3s2p1c3x8-neonfma-2x1.c | 138 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1() local 425 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1() local
|
D | 3x3s2p0p1c3x8-neon-2x1.c | 136 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1() local 425 const float32x4_t vk20c1x0123 = vld1q_f32(w + 48); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1() local
|
/external/XNNPACK/src/f32-conv-hwc2chw/ |
D | 3x3s2p1c3x4-sse-1x1.c | 105 const __m128 vk20c1x0123 = _mm_load_ps(w + 24); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() local 232 const __m128 vk20c1x0123 = _mm_load_ps(w + 24); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() local
|