未验证 提交 4030e756 编写于 作者: H HappyAngel 提交者: GitHub

[arm]fix concat axis < 0 compute error problem (#3802)

* fix concat axis < 0 error, test=develop

* fix format. test=develop
上级 30616633
...@@ -25,21 +25,21 @@ namespace mir { ...@@ -25,21 +25,21 @@ namespace mir {
void ConvActivationFusePass::Apply(const std::unique_ptr<SSAGraph>& graph) { void ConvActivationFusePass::Apply(const std::unique_ptr<SSAGraph>& graph) {
std::vector<std::string> act_types{"relu"}; std::vector<std::string> act_types{"relu"};
bool has_int8 = false; bool has_int8 = false;
bool has_arm_float = false; bool has_arm = false;
bool has_cuda = false; bool has_cuda = false;
for (auto& place : graph->valid_places()) { for (auto& place : graph->valid_places()) {
if (place.precision == PRECISION(kInt8)) { if (place.precision == PRECISION(kInt8)) {
has_int8 = true; has_int8 = true;
} }
if (place.target == TARGET(kARM) && place.precision == PRECISION(kFloat)) { if (place.target == TARGET(kARM)) {
has_arm_float = true; has_arm = true;
} }
if (place.target == TARGET(kCUDA)) { if (place.target == TARGET(kCUDA)) {
has_cuda = true; has_cuda = true;
} }
} }
if (!has_int8 && has_arm_float) { if (has_arm) {
act_types.push_back("relu6"); act_types.push_back("relu6");
act_types.push_back("leaky_relu"); act_types.push_back("leaky_relu");
} }
......
...@@ -52,11 +52,7 @@ void ConcatFunc(const std::vector<lite::Tensor*> inputs, ...@@ -52,11 +52,7 @@ void ConcatFunc(const std::vector<lite::Tensor*> inputs,
output_offset += in_stride[0]; output_offset += in_stride[0];
} }
} else { } else {
std::vector<lite::Tensor*> inputs_concat(inputs.size()); lite::arm::math::concat_func<T>(inputs, axis, out);
for (int j = 0; j < inputs.size(); ++j) {
inputs_concat[j] = inputs[j];
}
lite::arm::math::concat_func<T>(inputs_concat, axis, out);
} }
} }
...@@ -71,6 +67,9 @@ void ConcatCompute::Run() { ...@@ -71,6 +67,9 @@ void ConcatCompute::Run() {
auto* axis_tensor_data = axis_tensor->data<int>(); auto* axis_tensor_data = axis_tensor->data<int>();
axis = axis_tensor_data[0]; axis = axis_tensor_data[0];
} }
if (axis < 0) {
axis += inputs[0]->dims().size();
}
switch (inputs.front()->precision()) { switch (inputs.front()->precision()) {
case PRECISION(kFloat): case PRECISION(kFloat):
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册