// profiler.h
// Copyright (c) 2021 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#pragma once
#include "paddle/fluid/framework/tensor.h"
#include "paddle/fluid/framework/variable.h"
#include "paddle/fluid/platform/gpu_info.h"
#include "paddle/fluid/platform/timer.h"

namespace paddle {
namespace framework {
namespace interpreter {
// Plain aggregate holding the cost figures recorded by ProfilerGuard.
// Both fields start at zero.
struct CostInfo {
  // Accumulated elapsed time in milliseconds; ProfilerGuard adds to it with
  // `+=` each time a guard is destroyed.
  double total_time{0.};  // ms
  // Device memory size in bytes; ProfilerGuard overwrites (does not
  // accumulate) this value when it runs on a GPU place.
  size_t device_memory_bytes{0};  // total allocated memory size
};

29
class ProfilerGuard {
30
 public:
31 32 33
  ProfilerGuard(const platform::Place& place, CostInfo* cost_info)
      : place_(place), cost_info_(cost_info) {
    timer_.Start();
34 35
  }

36 37 38 39
  ~ProfilerGuard() {
    timer_.Pause();
    cost_info_->total_time += timer_.ElapsedMS();
    TotalCUDAAllocatedMemorySize(place_);
40 41
  }

42
 private:
43 44 45 46
  void TotalCUDAAllocatedMemorySize(const platform::Place& place) {
    if (platform::is_gpu_place(place)) {
#if defined(PADDLE_WITH_CUDA) || defined(PADDLE_WITH_HIP)
      auto cuda_place = BOOST_GET_CONST(platform::CUDAPlace, place);
47
      cost_info_->device_memory_bytes =
48 49 50 51 52
          platform::RecordedCudaMallocSize(cuda_place.device);
#endif
    }
  }

53 54
  const platform::Place& place_;
  CostInfo* cost_info_;
55 56
  platform::Timer timer_;
};

}  // namespace interpreter
}  // namespace framework
}  // namespace paddle