From 37ddb91aaeaf8191bc8252adfee9f06a7b092fc2 Mon Sep 17 00:00:00 2001 From: xiaogang Date: Wed, 12 Feb 2020 14:45:36 +0800 Subject: [PATCH] fix: fix conv_winograd multithreads bug (#2816) fix conv_winograd multithreads bug --- lite/backends/arm/math/conv3x3_winograd_fp32_c4.cc | 9 +++------ 1 file changed, 3 insertions(+), 6 deletions(-) diff --git a/lite/backends/arm/math/conv3x3_winograd_fp32_c4.cc b/lite/backends/arm/math/conv3x3_winograd_fp32_c4.cc index 69a2454cf0..d1992f62bb 100644 --- a/lite/backends/arm/math/conv3x3_winograd_fp32_c4.cc +++ b/lite/backends/arm/math/conv3x3_winograd_fp32_c4.cc @@ -122,8 +122,7 @@ void conv_compute_6x6_3x3(const float* input, // begin compute for (int ni = 0; ni < num; ++ni) { -// trans input to c4 -#pragma omp parallel for num_threads(threads) + // trans input to c4 for (int i = 0; i < ic_4; ++i) { prepack_input_nxwc4_dw(input + ni * in_n_stride, input_c4 + i * new_c_stride, @@ -410,8 +409,7 @@ void conv_compute_2x2_3x3(const float* input, // begin compute for (int ni = 0; ni < num; ++ni) { -// trans input to c4 -#pragma omp parallel for num_threads(threads) + // trans input to c4 for (int i = 0; i < ic_4; ++i) { prepack_input_nxwc4_dw(input + ni * in_n_stride, input_c4 + i * new_c_stride, @@ -672,9 +670,8 @@ void conv_compute_2x2_3x3_small(const float* input, // begin compute for (int ni = 0; ni < num; ++ni) { -// trans input to c4 + // trans input to c4 -#pragma omp parallel for num_threads(threads) for (int i = 0; i < ic_4; ++i) { prepack_input_nxwc4_dw(input + ni * in_n_stride, input_c4 + i * new_c_stride, -- GitLab