diff --git a/paddle/fluid/operators/optimizers/adam_op.h b/paddle/fluid/operators/optimizers/adam_op.h index f8c7b82053a113ad9c869a54efe955e81f8b1f66..6b794e0d3e0d0d66132883e954057076e978d600 100644 --- a/paddle/fluid/operators/optimizers/adam_op.h +++ b/paddle/fluid/operators/optimizers/adam_op.h @@ -509,6 +509,7 @@ class AdamOpKernel : public framework::OpKernel { for (size_t i = 0; i < fs.size(); ++i) fs[i].wait(); } else { if (lazy_mode) { + VLOG(3) << "run cpu lazy mode"; size_t row_count = grad_merge.rows().size(); std::vector cpu_rows(grad_merge.rows()); for (size_t row_index = 0; row_index < row_count; ++row_index) {