diff --git a/src/fpga/V2/api.cpp b/src/fpga/V2/api.cpp index d58e780c279e03b90b4ebe3731c6693615107ec4..daf8c72b8338d483dc4401c713fa7956e1b2bc1b 100644 --- a/src/fpga/V2/api.cpp +++ b/src/fpga/V2/api.cpp @@ -214,7 +214,7 @@ void fill_split_arg(struct SplitConvArgs *arg, framework::Tensor *input, arg->conv_arg[i].output.scale_address = out->scale; int num_after_alignment = filter::calc_aligned_num( - (int)input->dims()[1], arg->filter_num); // NOLINT + arg->filter_num, (int)input->dims()[1]); // NOLINT arg->conv_arg[i].free_space = fpga_malloc(num_after_alignment * 2 * sizeof(half)); } diff --git a/src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp b/src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp index 571987b3bf2a88c0d4ad648c7cb1966b538983a5..f74b188b56b0fa1360f6a6a728c415f67b95b9a9 100644 --- a/src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp +++ b/src/operators/kernel/fpga/V2/elementwise_add_relu_kernel.cpp @@ -21,7 +21,7 @@ namespace operators { template <> bool ElementwiseAddReluKernel::Init( ElementwiseAddReluParam *param) { - bool relu_enabled = false; + bool relu_enabled = true; auto *input_x = const_cast(param->InputX()); auto *input_y = const_cast(param->InputY()); auto *out = param->Out();