optimize eltwise computing order

ae7766cd · 虞连飞 · f654c291 · ae7766cd
隐藏空白更改
内联 | 并排

Showing with 12 additions and 14 deletions

mace/ops/eltwise.cc mace/ops/eltwise.cc +12 -14

未找到文件。
--- a/mace/ops/eltwise.cc
+++ b/mace/ops/eltwise.cc
@@ -900,23 +900,21 @@ class EltwiseOp : public Operation {
        }
      }

-      if (need_general_broadcast) {
+      if (input1->size() == 1) {
+        TensorScalarEltwise(type_, input0_ptr, input1_ptr[0], coeff_,
+                            input0->size(), swapped, output_ptr);
+      } else if (input0_shape == input1_shape) {
+        TensorEltwise(type_, input0_ptr, input1_ptr, coeff_, input0->size(),
+                      swapped, output_ptr);
+      } else if (need_general_broadcast) {
        TensorGeneralBroadcastEltwise(type_, input0_ptr, input1_ptr, coeff_,
                                      swapped, input0_shape, input1_shape,
                                      output_shape, output_ptr);
-      } else if (input1->size() == input0->size()) {
-        TensorEltwise(type_, input0_ptr, input1_ptr, coeff_, input0->size(),
-                      swapped, output_ptr);
-      } else if (input1->size() < input0->size()) {
-        if (input1->size() > 1) {
-          index_t common_size = input1->size();
-          index_t diff_size = input0->size() / common_size;
-          TensorBroadcastEltwise(type_, input0_ptr, input1_ptr, coeff_,
-                                 diff_size, common_size, swapped, output_ptr);
-        } else {
-          TensorScalarEltwise(type_, input0_ptr, input1_ptr[0], coeff_,
-                              input0->size(), swapped, output_ptr);
-        }
+      } else {
+        index_t common_size = input1->size();
+        index_t diff_size = input0->size() / common_size;
+        TensorBroadcastEltwise(type_, input0_ptr, input1_ptr, coeff_,
+                               diff_size, common_size, swapped, output_ptr);
      }
    }