remove multiplication from transpose

8fc1dd76 · dolphin8 · 4cfd981a · 8fc1dd76
隐藏空白更改
内联并排

Showing 1 changed file with 3 additions and 1 deletion

src/operators/kernel/arm/transpose_kernel.cpp src/operators/kernel/arm/transpose_kernel.cpp +3 -1

未找到文件。
--- a/src/operators/kernel/arm/transpose_kernel.cpp
+++ b/src/operators/kernel/arm/transpose_kernel.cpp
@@ -47,6 +47,7 @@ void TransposeKernel<CPU, float>::Compute(const TransposeParam& param) const {
  size_t ndim = axis.size();
  std::vector<int> xdim(ndim);
  std::vector<int> xstride(ndim);
+  std::vector<int> xout(ndim);
  for (int i = 0; i < ndim; i++) {
    int j = ndim - 1 - i;
    xdim[j] = input_x_dims[axis[i]];
@@ -54,6 +55,7 @@ void TransposeKernel<CPU, float>::Compute(const TransposeParam& param) const {
    for (int k = axis[i] + 1; k < ndim; k++) {
      xstride[j] *= input_x_dims[k];
    }
+    xout[j] = xstride[j] * xdim[j];
  }

  auto numel = input_x->numel();
@@ -68,7 +70,7 @@ void TransposeKernel<CPU, float>::Compute(const TransposeParam& param) const {
        ind[j + 1]++;
        ind[j] = 0;
        pind += xstride[j + 1];
-        pind -= xdim[j] * xstride[j];
+        pind -= xout[j];
      } else {
        break;
      }