提交 3a4c28fa 编写于 作者: L lizhenyu

change directory of akg cuda kernel

上级 a62c3e5c
......@@ -24,13 +24,13 @@ import _akg
from _akg import save_gpu_param as gpu_utils
from _akg.utils import validation_check as vc_util
MS_CUDA_KERNEL_PATH = "/tmp/cuda_meta/"
@vc_util.check_input_type(list, (list, tuple), (list, tuple), (types.FunctionType, type(None)), str, str, dict)
def op_build(opnames, computes, args, custom_schedule, device, kernel_name, attrs):
"""op_build"""
kernel_meta_path = "./cuda_meta_" + str(os.getpid()) + "/"
if device == "cuda":
cuda_path = os.path.realpath(MS_CUDA_KERNEL_PATH)
cuda_path = os.path.realpath(kernel_meta_path)
if not os.path.isdir(cuda_path):
os.makedirs(cuda_path)
if not opnames:
......@@ -43,7 +43,7 @@ def op_build(opnames, computes, args, custom_schedule, device, kernel_name, attr
logging.error("no schedule func found %s", str(schedule_name))
return None
ptx_file = os.path.realpath(MS_CUDA_KERNEL_PATH + kernel_name + ".ptx")
ptx_file = os.path.realpath(kernel_meta_path + kernel_name + ".ptx")
if os.path.exists(ptx_file):
os.chmod(ptx_file, 0o600)
try:
......@@ -55,7 +55,8 @@ def op_build(opnames, computes, args, custom_schedule, device, kernel_name, attr
foo = _akg.tvm.build(s, args, device, name=kernel_name)
ptx_code = foo.imported_modules[0].get_source("ptx")
file.write(ptx_code)
json_file = os.path.realpath(MS_CUDA_KERNEL_PATH + kernel_name + ".json")
json_file = os.path.realpath(
kernel_meta_path + kernel_name + ".json")
kernel_info = (ptx_code, json_file, kernel_name)
gpu_utils.save_gpu_params(s, args, kernel_info)
os.chmod(ptx_file, 0o400)
......
......@@ -28,11 +28,7 @@ namespace gpu {
namespace py = pybind11;
void GpuBuild(const KernelGraphPtr &kernel_graph) {
kernel::KernelMeta *bin_map = kernel::KernelMeta::GetInstance();
if (!bin_map->ReadIndex(kernel::kGpuKernelMeta)) {
MS_LOG(INFO) << "kernel cache miss, cache directory will be created later.";
} else {
MS_LOG(INFO) << "cache initialize to[" << kernel::kGpuKernelMeta << "].";
}
bin_map->Initialize();
MS_EXCEPTION_IF_NULL(kernel_graph);
auto kernels = kernel_graph->execution_order();
for (const auto &kernel : kernels) {
......
......@@ -27,6 +27,7 @@
#include "device/gpu/gpu_common.h"
#include "common/utils.h"
#include "device/gpu/gpu_memory_manager.h"
#include "kernel/common_utils.h"
namespace mindspore {
namespace device {
......@@ -104,6 +105,7 @@ void GPUKernelRuntime::ReleaseDeviceRes() {
if (mem_manager_ != nullptr) {
mem_manager_->FreeDeviceMemory();
}
kernel::KernelMeta::GetInstance()->RemoveKernelCache();
}
void GPUKernelRuntime::AssignMemory(session::KernelGraph *graph) {
......
......@@ -114,53 +114,35 @@ bool IsAtomicNode(const CNodePtr &kernel_node) {
return atomic_flag;
}
bool KernelMeta::ReadIndex(const std::string &bin_dir) {
DIR *dir = opendir(bin_dir.c_str());
if (dir == nullptr) {
void KernelMeta::Initialize() {
kernel_meta_path_ = std::string(kGpuKernelMeta) + "_" + std::to_string(getpid()) + "/";
// remove old kernel cache
RemoveKernelCache();
#if defined(_WIN32) || defined(_WIN64)
auto ret = mkdir(bin_dir.c_str());
auto ret = mkdir(kernel_meta_path_.c_str());
#else
auto ret = mkdir(bin_dir.c_str(), S_IRWXG | S_IRWXU);
auto ret = mkdir(kernel_meta_path_.c_str(), S_IRWXG | S_IRWXU);
#endif
if (ret != 0) {
MS_LOG(INFO) << "kernel dir not exist[" << bin_dir << "].";
return false;
}
dir = opendir(bin_dir.c_str());
if (ret != 0) {
MS_LOG(INFO) << "kernel dir [" << kernel_meta_path_ << "], will be created later";
}
initialized_ = true;
}
struct dirent *entry;
while ((entry = readdir(dir)) != nullptr) {
string bin_dir_tmp = bin_dir;
std::string cce_json = entry->d_name;
if (cce_json.length() <= 5) {
continue;
}
std::string suffix = cce_json.substr(cce_json.length() - 5);
if (suffix != kJsonSuffix) {
continue;
}
auto sp = cce_json.rfind('/');
if (sp != std::string::npos) {
continue;
}
sp = cce_json.rfind('.');
if (sp == std::string::npos) {
continue;
void KernelMeta::RemoveKernelCache() {
if (access(kernel_meta_path_.c_str(), 0) == 0) {
DIR *dir = opendir(kernel_meta_path_.c_str());
MS_EXCEPTION_IF_NULL(dir);
struct dirent *entry;
while ((entry = readdir(dir)) != nullptr) {
std::string kernel_file = entry->d_name;
std::string kernel_file_realpath = kernel_meta_path_ + kernel_file;
(void)remove(kernel_file_realpath.c_str());
}
auto kernel_name = cce_json.substr(0, sp);
(void)bin_dir_tmp.append("/");
(void)bin_dir_tmp.append(cce_json);
kernel_meta_map_[kernel_name] = bin_dir_tmp;
(void)closedir(dir);
(void)rmdir(kernel_meta_path_.c_str());
}
(void)closedir(dir);
MS_LOG(INFO) << "Cache kernel initialized, kernel size[" << kernel_meta_map_.size() << "].";
initialized_ = true;
return true;
}
std::string KernelMeta::Search(const std::string &kernel_name) const {
......@@ -176,11 +158,11 @@ std::string KernelMeta::Search(const std::string &kernel_name) const {
}
}
bool KernelMeta::Insert(const std::string &kernel_name, const std::string &cce_json) {
bool KernelMeta::Insert(const std::string &kernel_name, const std::string &kernel_json) {
if (!initialized_) {
return false;
}
kernel_meta_map_[kernel_name] = cce_json;
kernel_meta_map_[kernel_name] = kernel_json;
return true;
}
......@@ -191,8 +173,8 @@ bool CheckCache(const std::string &kernel_name) {
MS_LOG(DEBUG) << "kernel cache is invalid.";
return false;
}
std::string cce_json = bin_map->Search(kernel_name);
bool ret = (!cce_json.empty());
std::string kernel_json = bin_map->Search(kernel_name);
bool ret = (!kernel_json.empty());
if (ret) {
MS_LOG(INFO) << "Kernel name:" << kernel_name << " has registed.";
} else {
......@@ -209,12 +191,12 @@ KernelPackPtr SearchCache(const std::string &kernel_name, const std::string &pro
return nullptr;
}
std::string cce_json = bin_map->Search(kernel_name);
if (!cce_json.empty()) {
std::string kernel_json = bin_map->Search(kernel_name);
if (!kernel_json.empty()) {
KernelPackPtr kernel_pack = std::make_shared<KernelPack>();
// just a tmp solution.
if (!kernel_pack->ReadFromJsonFile(cce_json, processor)) {
MS_LOG(DEBUG) << "Read cache json and bin file failed[" << cce_json << "].";
if (!kernel_pack->ReadFromJsonFile(kernel_json, processor)) {
MS_LOG(DEBUG) << "Read cache json and bin file failed[" << kernel_json << "].";
return nullptr;
} else {
return kernel_pack;
......@@ -227,26 +209,26 @@ KernelPackPtr SearchCache(const std::string &kernel_name, const std::string &pro
KernelPackPtr InsertCache(const std::string &kernel_name, const std::string &processor) {
MS_LOG(INFO) << "kernel name:" << kernel_name << ", processr:" << processor;
std::string cce_json;
KernelMeta *bin_map = KernelMeta::GetInstance();
std::string kernel_json;
if (processor == kProcessorAiCore || processor == kProcessorAiCpu) {
cce_json = kCceKernelMeta;
kernel_json = kCceKernelMeta;
} else {
cce_json = kGpuKernelMeta;
kernel_json = bin_map->GetKernelMetaPath();
}
(void)cce_json.append(kernel_name).append(kJsonSuffix);
(void)kernel_json.append(kernel_name).append(kJsonSuffix);
KernelPackPtr kernel_pack = std::make_shared<KernelPack>();
if (!kernel_pack->ReadFromJsonFile(cce_json, processor)) {
MS_LOG(DEBUG) << "Read json and bin file failed[" << cce_json << "].";
if (!kernel_pack->ReadFromJsonFile(kernel_json, processor)) {
MS_LOG(DEBUG) << "Read json and bin file failed[" << kernel_json << "].";
return nullptr;
}
KernelMeta *bin_map = KernelMeta::GetInstance();
if (bin_map == nullptr) {
MS_LOG(DEBUG) << "kernel cache is invalid.";
return nullptr;
}
if (bin_map->Insert(kernel_name, cce_json)) {
MS_LOG(INFO) << "Insert to cache success[" << cce_json << "], kernelname[" << kernel_name << "].";
if (bin_map->Insert(kernel_name, kernel_json)) {
MS_LOG(INFO) << "Insert to cache success[" << kernel_json << "], kernelname[" << kernel_name << "].";
}
return kernel_pack;
}
......
......@@ -30,7 +30,7 @@
namespace mindspore {
namespace kernel {
constexpr auto kCceKernelMeta = "./kernel_meta/";
constexpr auto kGpuKernelMeta = "/tmp/cuda_meta/";
constexpr auto kGpuKernelMeta = "./cuda_meta";
constexpr auto kProcessorAiCore = "aicore";
constexpr auto kProcessorAiCpu = "aicpu";
constexpr auto kProcessorCuda = "cuda";
......@@ -51,9 +51,11 @@ using KernelMetaPtr = std::shared_ptr<KernelMetaInfo>;
class KernelMeta {
public:
KernelMeta() = default;
bool ReadIndex(const std::string &bin_dir);
void Initialize();
void RemoveKernelCache();
std::string Search(const std::string &kernel_name) const;
bool Insert(const std::string &kernel_name, const std::string &cce_json);
bool Insert(const std::string &kernel_name, const std::string &kernel_json);
std::string GetKernelMetaPath() { return kernel_meta_path_; }
static KernelMeta *GetInstance() {
static KernelMeta kernel_meta;
......@@ -63,6 +65,7 @@ class KernelMeta {
private:
bool initialized_ = false;
std::string kernel_meta_path_;
std::unordered_map<std::string, std::string> kernel_meta_map_;
};
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册