未验证 提交 0a2ae2ef 编写于 作者: A Arash Bakhtiari 提交者: GitHub

Fix the MLP output tensor's shape (#2380)

上级 ff427438
@@ -1083,8 +1083,8 @@ template <typename T>
 std::vector<at::Tensor> ds_mlp_gemm(at::Tensor& input,
                                     at::Tensor& residual,
                                     at::Tensor& input_bias,
-                                    at::Tensor& weight,
-                                    at::Tensor& weight1,
+                                    at::Tensor& weight_interm,
+                                    at::Tensor& weight_out,
                                     at::Tensor& bias,
                                     at::Tensor& gamma,
                                     at::Tensor& beta,
@@ -1102,7 +1102,7 @@ std::vector<at::Tensor> ds_mlp_gemm(at::Tensor& input,
                                  .device(at::kCUDA)
                                  .requires_grad(false);
-    int out_size = q_int8 ? weight.size(0) : weight.size(1);
+    int out_size = q_int8 ? weight_out.size(0) : weight_out.size(1);
     auto output = at::from_blob((T*)Context::Instance().GetWorkSpace() + torch::numel(input),
                                 {input.size(0), input.size(1), out_size},
                                 options);
@@ -1113,8 +1113,8 @@ std::vector<at::Tensor> ds_mlp_gemm(at::Tensor& input,
                                          mlp_after_attn ? input : residual,
                                          residual,
                                          input_bias,
-                                         weight,
-                                         weight1,
+                                         weight_interm,
+                                         weight_out,
                                          bias,
                                          gamma,
                                          beta,
...
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册