Merge pull request #1339 from qnqinan/develop

fix bugs for FPGA v2 track

Merge pull request #1339 from qnqinan/develop
fix bugs for FPGA v2 track
2f04b124 · zhangyang0701 · GitHub · defbd4f9 · cebe2e39 · 2f04b124
隐藏空白更改
内联 | 并排

Showing 2 changed files with 2 additions and 2 deletions

src/fpga/V2/api.cpp src/fpga/V2/api.cpp +1 -1

src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp +1 -1

未找到文件。
--- a/src/fpga/V2/api.cpp
+++ b/src/fpga/V2/api.cpp
@@ -214,7 +214,7 @@ void fill_split_arg(struct SplitConvArgs *arg, framework::Tensor *input,
    arg->conv_arg[i].output.scale_address = out->scale;
    int num_after_alignment = filter::calc_aligned_num(
-        (int)input->dims()[1], arg->filter_num);  // NOLINT
+        arg->filter_num, (int)input->dims()[1]);  // NOLINT
    arg->conv_arg[i].free_space =
        fpga_malloc(num_after_alignment * 2 * sizeof(half));
  }

--- a/src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp
+++ b/src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp
@@ -21,7 +21,7 @@ namespace operators {
 template <>
 bool ElementwiseAddReluKernel<FPGA, float>::Init(
    ElementwiseAddReluParam<FPGA> *param) {
-  bool relu_enabled = false;
+  bool relu_enabled = true;
  auto *input_x = const_cast<LoDTensor *>(param->InputX());
  auto *input_y = const_cast<LoDTensor *>(param->InputY());
  auto *out = param->Out();