/external/XNNPACK/test/ |
D | f32-conv-hwc.cc | 214 TEST(F32_CONV_3X3S2P1C3X8__NEON_2X2, output_y_start) { in TEST() argument 216 for (size_t output_y_start = 1; output_y_start <= 3; output_y_start++) { in TEST() local 228 .output_y_start(output_y_start) in TEST() 494 TEST(F32_CONV_3X3S2P1C3X4__NEON_2X2, output_y_start) { in TEST() argument 496 for (size_t output_y_start = 1; output_y_start <= 3; output_y_start++) { in TEST() local 508 .output_y_start(output_y_start) in TEST() 775 TEST(F32_CONV_3X3S2P0P1C3X8__NEON_2X2, output_y_start) { in TEST() argument 777 for (size_t output_y_start = 1; output_y_start <= 3; output_y_start++) { in TEST() local 789 .output_y_start(output_y_start) in TEST() 1056 TEST(F32_CONV_3X3S2P0P1C3X4__NEON_2X2, output_y_start) { in TEST() argument [all …]
|
D | f32-conv-hwc2chw.cc | 214 TEST(F32_CONV_HWC2CHW_3X3S2P1C3X4__NEON_2X2, output_y_start) { in TEST() argument 216 for (size_t output_y_start = 1; output_y_start <= 3; output_y_start++) { in TEST() local 228 .output_y_start(output_y_start) in TEST() 495 TEST(F32_CONV_HWC2CHW_3X3S2P1C3X4__NEONFMA_2X2, output_y_start) { in TEST() argument 497 for (size_t output_y_start = 1; output_y_start <= 3; output_y_start++) { in TEST() local 509 .output_y_start(output_y_start) in TEST() 744 TEST(F32_CONV_HWC2CHW_3X3S2P1C3X4__SSE_1X1, output_y_start) { in TEST() argument 746 for (size_t output_y_start = 1; output_y_start <= 3; output_y_start++) { in TEST() local 758 .output_y_start(output_y_start) in TEST() 993 TEST(F32_CONV_HWC2CHW_3X3S2P1C3X4__SSE_2X2, output_y_start) { in TEST() argument [all …]
|
D | conv-hwc2chw-microkernel-tester.h | 215 inline ConvHWC2CHWMicrokernelTester& output_y_start(uint32_t output_y_start) { in output_y_start() argument 216 this->output_y_start_ = output_y_start; in output_y_start() 220 inline uint32_t output_y_start() const { in output_y_start() function 291 ASSERT_LT(output_y_start(), output_height()); 293 ASSERT_GT(output_y_end(), output_y_start()); 377 output_y_start(), output_y_end(), 386 for (size_t y = output_y_start(); y < output_y_end(); y++) {
|
D | conv-hwc-microkernel-tester.h | 215 inline ConvHWCMicrokernelTester& output_y_start(uint32_t output_y_start) { in output_y_start() function 216 this->output_y_start_ = output_y_start; in output_y_start() 220 inline uint32_t output_y_start() const { in output_y_start() function 285 ASSERT_LT(output_y_start(), output_height()); 287 ASSERT_GT(output_y_end(), output_y_start()); 371 output_y_start(), output_y_end(), 380 for (size_t y = output_y_start(); y < output_y_end(); y++) {
|
/external/XNNPACK/src/xnnpack/ |
D | conv.h | 26 size_t output_y_start, \ 63 size_t output_y_start, \
|
/external/XNNPACK/src/f32-conv-hwc2chw/ |
D | 3x3s2p1c3x4-sse-1x1.c | 17 size_t output_y_start, in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() argument 30 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 40 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 43 float* output0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 45 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1() 52 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 1) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_1x1()
|
D | 3x3s2p1c3x4-scalar-1x1.c | 15 size_t output_y_start, in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() argument 28 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 38 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 41 float* output0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 43 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1() 50 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 1) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__scalar_1x1()
|
D | 3x3s2p1c3x4-neonfma-2x2.c | 17 size_t output_y_start, in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() argument 30 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 40 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 45 float* output0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 48 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2() 55 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neonfma_2x2()
|
D | 3x3s2p1c3x4-neon-2x2.c | 17 size_t output_y_start, in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() argument 30 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 40 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 45 float* output0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 48 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2() 55 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__neon_2x2()
|
D | 3x3s2p1c3x4-wasmsimd-2x2.c | 17 size_t output_y_start, in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() argument 30 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 40 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 45 float* output0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 48 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2() 56 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__wasmsimd_2x2()
|
D | 3x3s2p1c3x4-sse-2x2.c | 17 size_t output_y_start, in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() argument 30 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 40 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 45 float* output0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 48 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2() 55 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc2chw_ukernel_3x3s2p1c3x4__sse_2x2()
|
/external/XNNPACK/src/f32-conv-hwc/gen/ |
D | 3x3s2p0p1c3x4-neon-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1() 60 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x1()
|
D | 3x3s2p1c3x4-neonfma-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1() 62 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x1()
|
D | 3x3s2p1c3x4-neon-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1() 60 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x1()
|
D | 3x3s2p0p1c3x4-neonfma-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1() 62 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x1()
|
D | 3x3s2p1c3x8-neon-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1() 60 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neon_2x1()
|
D | 3x3s2p0p1c3x8-neonfma-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1() 62 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neonfma_2x1()
|
D | 3x3s2p1c3x8-neonfma-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1() 62 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x8__neonfma_2x1()
|
D | 3x3s2p0p1c3x8-neon-2x1.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1() 60 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x8__neon_2x1()
|
D | 3x3s2p0p1c3x4-neonfma-2x2.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2() 62 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neonfma_2x2()
|
D | 3x3s2p1c3x4-neon-2x2.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2() 60 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neon_2x2()
|
D | 3x3s2p0p1c3x4-neon-2x2.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2() 60 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__neon_2x2()
|
D | 3x3s2p1c3x4-neonfma-2x2.c | 22 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() argument 35 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 47 input_height_stride * (output_y_start * 2 /* vertical stride */ - input_padding_top)); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 52 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 55 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2() 62 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 2) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__neonfma_2x2()
|
/external/XNNPACK/src/f32-conv-hwc/ |
D | 3x3s2p1c3x4-scalar-1x1.c | 15 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__scalar_1x1() argument 28 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__scalar_1x1() 39 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__scalar_1x1() 42 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__scalar_1x1() 44 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__scalar_1x1() 51 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 1) { in xnn_f32_conv_hwc_ukernel_3x3s2p1c3x4__scalar_1x1()
|
D | 3x3s2p0p1c3x4-scalar-1x1.c | 15 size_t output_y_start, in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__scalar_1x1() argument 28 assert(output_y_end > output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__scalar_1x1() 39 …const float* i0 = (const float*) ((uintptr_t) input + input_height_stride * (output_y_start * 2 - … in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__scalar_1x1() 42 float* o0 = (float*) ((uintptr_t) output + output_height_stride * output_y_start); in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__scalar_1x1() 44 if XNN_UNPREDICTABLE(output_y_start < input_padding_top) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__scalar_1x1() 51 for (size_t output_y = output_y_start; output_y < output_y_end; output_y += 1) { in xnn_f32_conv_hwc_ukernel_3x3s2p0p1c3x4__scalar_1x1()
|