"fix error"

73883bde · Dong Zhihong · d4d215a5 · 73883bde
隐藏空白更改
内联并排

Showing 1 changed file with 7 additions and 4 deletions

paddle/operators/nccl/nccl_ops.h +7 -4

未找到文件。
--- a/paddle/operators/nccl/nccl_ops.h
+++ b/paddle/operators/nccl/nccl_ops.h
@@ -7,6 +7,8 @@
 namespace paddle {
 namespace operators {

+using framework::Tensor;
+
 template <typename Type>
 class NCCLTypeWrapper;

@@ -21,7 +23,7 @@ class NCCLTypeWrapper<double> {
 };

 template <typename T>
-class NCCLAllReduceKernel : public framework::OpKernel {
+class NCCLAllReduceKernel : public framework::OpKernel<T> {
 public:
  void Compute(const framework::ExecutionContext& ctx) const override {
    auto ins = ctx.MultiInput<Tensor>("X");
@@ -35,13 +37,14 @@ class NCCLAllReduceKernel : public framework::OpKernel {
      op_type = ncclProd;
    } else if (reduction == "ncclMin") {
      op_type = ncclMin;
-    } else
-      (reduction == "ncclMax") { op_type = ncclMax; }
+    } else if (reduction == "ncclMax") {
+      op_type = ncclMax;
+    }

    auto dev_ctx =
        static_cast<const platform::CUDADeviceContext>(ctx.device_context());

-    NCCLManager* m = NCCLManager::Get();
+    platform::NCCLManager* m = platform::NCCLManager::Get();

    auto* comm = m->GetCommunicator(gpus);
    comm->wg_.Add(1);