Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
magicwindyyd
mindspore
提交
1d078329
M
mindspore
项目概览
magicwindyyd
/
mindspore
与 Fork 源项目一致
Fork自
MindSpore / mindspore
通知
1
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
M
mindspore
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
提交
1d078329
编写于
6月 17, 2020
作者:
L
lvliang
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
merge-pynative-and-static-memory-into-mempool
上级
51f8ffab
变更
10
显示空白变更内容
内联
并排
Showing
10 changed file
with
125 addition
and
49 deletion
+125
-49
mindspore/ccsrc/device/ascend/ascend_device_address.cc
mindspore/ccsrc/device/ascend/ascend_device_address.cc
+11
-1
mindspore/ccsrc/device/ascend/ascend_device_address.h
mindspore/ccsrc/device/ascend/ascend_device_address.h
+2
-0
mindspore/ccsrc/device/ascend/ascend_memory_manager.cc
mindspore/ccsrc/device/ascend/ascend_memory_manager.cc
+61
-18
mindspore/ccsrc/device/ascend/ascend_memory_manager.h
mindspore/ccsrc/device/ascend/ascend_memory_manager.h
+5
-0
mindspore/ccsrc/device/ascend/ascend_memory_pool.cc
mindspore/ccsrc/device/ascend/ascend_memory_pool.cc
+25
-16
mindspore/ccsrc/device/ascend/ascend_memory_pool.h
mindspore/ccsrc/device/ascend/ascend_memory_pool.h
+5
-11
mindspore/ccsrc/device/device_address.h
mindspore/ccsrc/device/device_address.h
+1
-0
mindspore/ccsrc/device/kernel_runtime.cc
mindspore/ccsrc/device/kernel_runtime.cc
+10
-0
mindspore/ccsrc/device/memory_manager.h
mindspore/ccsrc/device/memory_manager.h
+1
-1
mindspore/ccsrc/pre_activate/mem_reuse/mem_dynamic_allocator.cc
...ore/ccsrc/pre_activate/mem_reuse/mem_dynamic_allocator.cc
+4
-2
未找到文件。
mindspore/ccsrc/device/ascend/ascend_device_address.cc
浏览文件 @
1d078329
...
...
@@ -303,12 +303,22 @@ bool AscendDeviceAddress::ConvertFormatAndSyncHostToDevice(const std::vector<int
return
sync_ok
;
}
void
AscendDeviceAddress
::
UpdateCommunicationAddress
()
{
MS_EXCEPTION_IF_NULL
(
ptr_
);
communication_ptr_
=
reinterpret_cast
<
uint8_t
*>
(
ptr_
)
-
kMemAlignSize
;
}
AscendDeviceAddress
::~
AscendDeviceAddress
()
{
if
(
ptr_
==
nullptr
)
{
return
;
}
if
(
from_mem_pool_
)
{
if
(
communication_ptr_
!=
nullptr
)
{
AscendMemoryPool
::
GetInstance
().
FreeTensorMem
(
communication_ptr_
);
communication_ptr_
=
nullptr
;
}
else
{
AscendMemoryPool
::
GetInstance
().
FreeTensorMem
(
ptr_
);
}
ptr_
=
nullptr
;
}
}
...
...
mindspore/ccsrc/device/ascend/ascend_device_address.h
浏览文件 @
1d078329
...
...
@@ -39,6 +39,7 @@ class AscendDeviceAddress : public DeviceAddress {
bool
SyncDeviceToHost
(
const
std
::
vector
<
int
>
&
shape
,
size_t
size
,
TypeId
type
,
void
*
host_ptr
)
const
override
;
bool
SyncHostToDevice
(
const
std
::
vector
<
int
>
&
shape
,
size_t
size
,
TypeId
type
,
const
void
*
host_ptr
)
const
override
;
DeviceAddressType
DeviceType
()
const
override
{
return
DeviceAddressType
::
kAscend
;
}
void
UpdateCommunicationAddress
()
override
;
#ifdef ENABLE_DUMP_E2E
bool
DumpMemToFile
(
bool
dump_mode
,
const
std
::
string
&
filepath
,
const
std
::
string
&
host_fmt
,
const
std
::
vector
<
int
>
&
host_shape
,
TypeId
host_type
)
const
;
...
...
@@ -53,6 +54,7 @@ class AscendDeviceAddress : public DeviceAddress {
bool
ConvertFormatAndSyncHostToDevice
(
const
std
::
vector
<
int
>
&
shape
,
size_t
size
,
TypeId
type
,
const
void
*
host_ptr
)
const
;
void
SyncStream
()
const
;
uint8_t
*
communication_ptr_
{
nullptr
};
};
using
AscendDeviceAddressPtr
=
std
::
shared_ptr
<
AscendDeviceAddress
>
;
}
// namespace ascend
...
...
mindspore/ccsrc/device/ascend/ascend_memory_manager.cc
浏览文件 @
1d078329
...
...
@@ -21,31 +21,22 @@
namespace
mindspore
{
namespace
device
{
namespace
ascend
{
constexpr
uint64_t
kAscendDeviceMemGB
=
26
;
constexpr
uint64_t
kAscendMemPoolGB
=
4
;
constexpr
uint64_t
kAscendDeviceMemGB
=
30
;
constexpr
uint64_t
kMemSizeGB
=
30
;
constexpr
uint64_t
kMaxMemSizeGB
=
30
;
constexpr
uint64_t
kAscendDeviceMemSize
=
(
kAscendDeviceMemGB
<<
kMemSizeGB
);
constexpr
uint64_t
kAscendMemPoolSize
=
(
kAscendMemPoolGB
<<
kMemSizeGB
);
void
AscendMemoryManager
::
MallocDeviceMemory
()
{
auto
context_mem
=
GetDeviceMemSizeFromContext
();
device_mem_size_
=
context_mem
==
0
?
kAscendDeviceMemSize
:
context_mem
;
static_mem_offset_
=
device_mem_size_
;
auto
ret
=
rtMalloc
(
reinterpret_cast
<
void
**>
(
&
device_mem_base_
),
static_mem_offset_
,
RT_MEMORY_HBM
);
if
(
ret
!=
RT_ERROR_NONE
)
{
MS_EXCEPTION
(
DeviceProcessError
)
<<
"rtMalloc mem size["
<<
static_mem_offset_
<<
"] fail, ret["
<<
ret
<<
"]"
;
}
dynamic_mem_offset_
=
device_mem_size_
;
auto
ret
=
rtMalloc
(
reinterpret_cast
<
void
**>
(
&
device_mem_base_
),
dynamic_mem_offset_
,
RT_MEMORY_HBM
);
if
(
context_mem
==
0
)
{
device_mem_pool_size_
=
kAscendMemPoolSize
;
ret
=
rtMalloc
(
reinterpret_cast
<
void
**>
(
&
device_mem_pool_base_
),
device_mem_pool_size_
,
RT_MEMORY_HBM
);
if
(
ret
!=
RT_ERROR_NONE
)
{
MS_EXCEPTION
(
DeviceProcessError
)
<<
"rtMalloc mem size["
<<
device_mem_pool_size_
<<
"] fail, ret["
<<
ret
<<
"]"
;
}
AscendMemoryPool
::
GetInstance
().
set_device_mem_pool_base
(
device_mem_pool_base_
);
AscendMemoryPool
::
GetInstance
().
set_device_mem_pool_size
(
device_mem_pool_size_
);
MS_EXCEPTION
(
DeviceProcessError
)
<<
"rtMalloc mem size["
<<
dynamic_mem_offset_
<<
"] fail, ret["
<<
ret
<<
"]"
;
}
AscendMemoryPool
::
GetInstance
().
set_device_mem_pool_base
(
device_mem_base_
);
AscendMemoryPool
::
GetInstance
().
set_graph_dynamic_mem_offset
(
dynamic_mem_offset_
);
}
uint64_t
AscendMemoryManager
::
GetDeviceMemSizeFromContext
()
{
...
...
@@ -63,7 +54,7 @@ uint64_t AscendMemoryManager::GetDeviceMemSizeFromContext() {
auto
gb_str
=
variable_memory_max_size
.
substr
(
0
,
pos
);
auto
gb_var
=
std
::
stoull
(
gb_str
);
MS_LOG
(
INFO
)
<<
"variable_memory_max_size(GB):"
<<
gb_var
;
if
(
gb_var
>
k
MaxMemSize
GB
||
gb_var
==
0
)
{
if
(
gb_var
>
k
AscendDeviceMem
GB
||
gb_var
==
0
)
{
MS_LOG
(
EXCEPTION
)
<<
"Invalid allocate memory size:"
<<
gb_var
<<
" which should be in (0-30]GB"
;
}
return
gb_var
<<
kMemSizeGB
;
...
...
@@ -86,8 +77,60 @@ void AscendMemoryManager::FreeDeviceMemory() {
}
}
void
AscendMemoryManager
::
ResetDynamicMemory
()
{
total_dynamic_size_
=
0
;
dynamic_mem_offset_
=
device_mem_size_
;
AscendMemoryPool
::
GetInstance
().
set_graph_dynamic_mem_offset
(
dynamic_mem_offset_
);
}
void
*
AscendMemoryManager
::
MallocMemFromMemPool
(
size_t
size
)
{
return
AscendMemoryPool
::
GetInstance
().
AllocTensorMem
(
size
);
auto
align_size
=
GetCommonAlignSize
(
size
);
return
AscendMemoryPool
::
GetInstance
().
AllocTensorMem
(
align_size
);
}
uint8_t
*
AscendMemoryManager
::
MallocStaticMem
(
size_t
size
,
bool
communication_mem
)
{
size_t
align_size
=
0
;
if
(
communication_mem
)
{
align_size
=
GetCommunicationAlignSize
(
size
);
}
else
{
align_size
=
GetCommonAlignSize
(
size
);
}
if
(
communication_mem
)
{
// create protect area [kMemAlignSize -- data -- kMemAlignSize]
uint8_t
*
alloc_address
=
reinterpret_cast
<
uint8_t
*>
(
AscendMemoryPool
::
GetInstance
().
AllocTensorMem
(
align_size
));
return
alloc_address
+
kMemAlignSize
;
}
else
{
return
reinterpret_cast
<
uint8_t
*>
(
AscendMemoryPool
::
GetInstance
().
AllocTensorMem
(
align_size
));
}
}
uint8_t
*
AscendMemoryManager
::
MallocDynamicMem
(
size_t
size
,
bool
communication_mem
)
{
size_t
align_size
=
0
;
if
(
communication_mem
)
{
align_size
=
GetCommunicationAlignSize
(
size
);
}
else
{
align_size
=
GetCommonAlignSize
(
size
);
}
if
(
dynamic_mem_offset_
<
align_size
)
{
MS_LOG
(
EXCEPTION
)
<<
"Out of memory!!! total["
<<
device_mem_size_
<<
"] (dynamic["
<<
total_dynamic_size_
<<
"]) malloc ["
<<
align_size
<<
"] failed!"
;
}
auto
new_offset
=
dynamic_mem_offset_
-
align_size
;
auto
device_mem_pool_offset
=
AscendMemoryPool
::
GetInstance
().
device_mem_pool_offset
();
if
(
new_offset
<=
device_mem_pool_offset
)
{
MS_LOG
(
EXCEPTION
)
<<
"Out of memory!!! total["
<<
device_mem_size_
<<
"] (dynamic["
<<
total_dynamic_size_
<<
"] memory pool["
<<
device_mem_pool_offset
<<
"])"
<<
" malloc ["
<<
align_size
<<
"] failed!"
;
}
total_dynamic_size_
+=
align_size
;
dynamic_mem_offset_
=
new_offset
;
AscendMemoryPool
::
GetInstance
().
set_graph_dynamic_mem_offset
(
dynamic_mem_offset_
);
if
(
communication_mem
)
{
// create protect area [kMemAlignSize -- data -- kMemAlignSize]
return
device_mem_base_
+
new_offset
+
kMemAlignSize
;
}
else
{
return
device_mem_base_
+
new_offset
;
}
}
}
// namespace ascend
}
// namespace device
...
...
mindspore/ccsrc/device/ascend/ascend_memory_manager.h
浏览文件 @
1d078329
...
...
@@ -27,8 +27,13 @@ class AscendMemoryManager : public MemoryManager {
void
MallocDeviceMemory
()
override
;
void
FreeDeviceMemory
()
override
;
void
ResetDynamicMemory
()
override
;
void
*
MallocMemFromMemPool
(
size_t
size
)
override
;
protected:
uint8_t
*
MallocStaticMem
(
size_t
size
,
bool
communication_mem
)
override
;
uint8_t
*
MallocDynamicMem
(
size_t
size
,
bool
communication_mem
)
override
;
private:
uint8_t
*
device_mem_pool_base_
{
nullptr
};
uint64_t
device_mem_pool_size_
{
0
};
...
...
mindspore/ccsrc/device/ascend/ascend_memory_pool.cc
浏览文件 @
1d078329
...
...
@@ -22,45 +22,54 @@ namespace mindspore {
namespace
device
{
namespace
ascend
{
size_t
AscendMemoryPool
::
AllocDeviceMem
(
size_t
size
,
DeviceMemPtr
*
addr
)
{
if
(
has_malloc_
)
{
MS_LOG
(
EXCEPTION
)
<<
"
Has alloc memory pool memory
!"
;
if
(
size
==
0
)
{
MS_LOG
(
EXCEPTION
)
<<
"
Can not alloc memory size(0) in memory pool
!"
;
}
if
(
size
==
0
||
size
>
free_mem_size_
)
{
MS_LOG
(
EXCEPTION
)
<<
"Failed to alloc memory pool memory !"
;
if
(
device_mem_pool_offset_
+
size
>=
graph_dynamic_mem_offset_
)
{
MS_LOG
(
EXCEPTION
)
<<
"Failed to alloc memory pool memory, the current device_mem_pool_offset_ ["
<<
device_mem_pool_offset_
<<
"], current graph_dynamic_mem_offset_ "
<<
graph_dynamic_mem_offset_
<<
"], need memory size ["
<<
size
<<
"]"
;
}
*
addr
=
device_mem_pool_base_
;
*
addr
=
device_mem_pool_base_
+
device_mem_pool_offset_
;
device_mem_pool_offset_
+=
size
;
if
(
*
addr
==
nullptr
)
{
MS_LOG
(
EXCEPTION
)
<<
"
Device memory pool base
is nullptr, failed to alloc memory pool memory!"
;
MS_LOG
(
EXCEPTION
)
<<
"
Alloc device address
is nullptr, failed to alloc memory pool memory!"
;
}
has_malloc_
=
true
;
free_mem_size_
-=
size
;
return
size
;
}
bool
AscendMemoryPool
::
FreeDeviceMem
(
const
DeviceMemPtr
&
addr
)
{
MS_EXCEPTION_IF_NULL
(
addr
);
has_malloc_
=
false
;
free_mem_size_
=
total_mem_size_
;
return
true
;
}
size_t
AscendMemoryPool
::
AlignMemorySize
(
size_t
size
)
const
{
if
(
size
==
0
)
{
return
DYNAMIC_MEM_ALIGN_SIZE
;
MS_LOG
(
EXCEPTION
)
<<
"The align memory size is a zero !"
;
}
return
((
size
+
DYNAMIC_MEM_ALIGN_SIZE
+
31
)
/
DYNAMIC_MEM_ALIGN_SIZE
)
*
DYNAMIC_MEM_ALIGN_SIZE
;
return
size
;
}
size_t
AscendMemoryPool
::
mem_alloc_unit_size
()
const
{
return
free_mem_size_
-
512
;
}
void
AscendMemoryPool
::
set_device_mem_pool_base
(
uint8_t
*
device_mem_pool_base
)
{
MS_EXCEPTION_IF_NULL
(
device_mem_pool_base
);
device_mem_pool_base_
=
device_mem_pool_base
;
}
size_t
AscendMemoryPool
::
free_mem_size
()
{
return
free_mem_size_
;
}
void
AscendMemoryPool
::
set_graph_dynamic_mem_offset
(
uint64_t
graph_dynamic_mem_offset
)
{
graph_dynamic_mem_offset_
=
graph_dynamic_mem_offset
;
}
uint64_t
AscendMemoryPool
::
device_mem_pool_offset
()
const
{
return
device_mem_pool_offset_
;
}
size_t
AscendMemoryPool
::
free_mem_size
()
{
if
(
graph_dynamic_mem_offset_
<
device_mem_pool_offset_
)
{
MS_LOG
(
EXCEPTION
)
<<
"graph dynamic mem offset ["
<<
graph_dynamic_mem_offset_
<<
"] less than device mem pool offset ["
<<
device_mem_pool_offset_
<<
"]!"
;
}
return
graph_dynamic_mem_offset_
-
device_mem_pool_offset_
;
}
size_t
AscendMemoryPool
::
total_mem_size
()
{
return
total_mem_size_
;
}
size_t
AscendMemoryPool
::
total_mem_size
()
{
return
graph_dynamic_mem_offset_
==
0
?
0
:
graph_dynamic_mem_offset_
-
1
;
}
}
// namespace ascend
}
// namespace device
}
// namespace mindspore
mindspore/ccsrc/device/ascend/ascend_memory_pool.h
浏览文件 @
1d078329
...
...
@@ -32,11 +32,9 @@ class AscendMemoryPool : public DynamicMemPoolBestFit {
size_t
AllocDeviceMem
(
size_t
size
,
DeviceMemPtr
*
addr
)
override
;
bool
FreeDeviceMem
(
const
DeviceMemPtr
&
addr
)
override
;
void
set_device_mem_pool_base
(
uint8_t
*
device_mem_pool_base
);
void
set_device_mem_pool_size
(
uint64_t
device_mem_pool_size
)
{
device_mem_pool_size_
=
device_mem_pool_size
;
free_mem_size_
=
device_mem_pool_size_
;
total_mem_size_
=
free_mem_size_
;
}
void
set_graph_dynamic_mem_offset
(
uint64_t
graph_dynamic_mem_offset
);
uint64_t
device_mem_pool_offset
()
const
;
size_t
free_mem_size
()
override
;
size_t
total_mem_size
()
override
;
...
...
@@ -48,16 +46,12 @@ class AscendMemoryPool : public DynamicMemPoolBestFit {
protected:
// The real size by memory alloc aligned.
size_t
AlignMemorySize
(
size_t
size
)
const
override
;
// Get the minimum memory unit size using for dynamic extend.
size_t
mem_alloc_unit_size
()
const
override
;
private:
AscendMemoryPool
()
=
default
;
bool
has_malloc_
{
false
};
uint8_t
*
device_mem_pool_base_
{
nullptr
};
uint64_t
device_mem_pool_size_
{
0
};
size_t
free_mem_size_
{
0
};
size_t
total_mem_size_
{
0
};
uint64_t
device_mem_pool_offset_
{
0
};
uint64_t
graph_dynamic_mem_offset_
{
0
};
};
}
// namespace ascend
}
// namespace device
...
...
mindspore/ccsrc/device/device_address.h
浏览文件 @
1d078329
...
...
@@ -64,6 +64,7 @@ class DeviceAddress {
std
::
string
format
()
const
{
return
format_
;
}
TypeId
type_id
()
const
{
return
type_id_
;
}
void
set_host_shape
(
const
std
::
vector
<
int
>
&
shape
)
{
host_shape_
=
shape
;
}
virtual
void
UpdateCommunicationAddress
()
{}
virtual
void
set_status
(
DeviceAddressStatus
status
)
{}
virtual
DeviceAddressStatus
status
()
const
{
return
DeviceAddressStatus
::
kInDevice
;
}
virtual
DeviceAddressType
DeviceType
()
const
{
return
DeviceAddressType
::
kUnknown
;
}
...
...
mindspore/ccsrc/device/kernel_runtime.cc
浏览文件 @
1d078329
...
...
@@ -431,6 +431,10 @@ void KernelRuntime::AssignCommunicationNodeOutputMem(int flag, const AnfNodePtr
std
::
string
output_format
=
AnfAlgo
::
GetOutputFormat
(
node
,
j
);
auto
output_type
=
AnfAlgo
::
GetOutputDeviceDataType
(
node
,
j
);
auto
address
=
CreateDeviceAddress
(
output_ptr
,
output_sizes
[
j
],
output_format
,
output_type
);
MS_EXCEPTION_IF_NULL
(
address
);
if
(
AnfAlgo
::
IsCommunicationOp
(
node
)
&&
context_ptr
->
enable_hccl
())
{
address
->
UpdateCommunicationAddress
();
}
AnfAlgo
::
SetOutputAddr
(
address
,
j
,
node
.
get
());
output_ptr
+=
align_size_list
[
j
];
}
...
...
@@ -480,6 +484,8 @@ void KernelRuntime::AssignCommunicationNodeInputMem(const AnfNodePtr &node) {
}
void
KernelRuntime
::
AssignNodeOutputMem
(
int
flag
,
const
AnfNodePtr
&
node
,
int
index
)
{
auto
context_ptr
=
MsContext
::
GetInstance
();
MS_EXCEPTION_IF_NULL
(
context_ptr
);
MS_EXCEPTION_IF_NULL
(
node
);
MS_EXCEPTION_IF_NULL
(
mem_manager_
);
if
(
AnfAlgo
::
IsGetNext
(
NOT_NULL
(
node
))
&&
flag
==
kReuseDynamicMem
)
{
...
...
@@ -509,7 +515,11 @@ void KernelRuntime::AssignNodeOutputMem(int flag, const AnfNodePtr &node, int in
std
::
string
output_format
=
AnfAlgo
::
GetOutputFormat
(
node
,
i
);
auto
output_type
=
AnfAlgo
::
GetOutputDeviceDataType
(
node
,
i
);
auto
device_address
=
CreateDeviceAddress
(
ptr
,
output_sizes
[
i
],
output_format
,
output_type
);
MS_EXCEPTION_IF_NULL
(
device_address
);
device_address
->
set_host_shape
(
trans
::
GetRuntimePaddingShape
(
node
,
i
));
if
(
AnfAlgo
::
IsCommunicationOp
(
node
)
&&
context_ptr
->
enable_hccl
())
{
device_address
->
UpdateCommunicationAddress
();
}
AnfAlgo
::
SetOutputAddr
(
device_address
,
i
,
node
.
get
());
}
}
...
...
mindspore/ccsrc/device/memory_manager.h
浏览文件 @
1d078329
...
...
@@ -36,7 +36,7 @@ class MemoryManager {
virtual
void
MallocDeviceMemory
()
=
0
;
virtual
void
FreeDeviceMemory
()
=
0
;
void
ResetDynamicMemory
()
{
v
irtual
v
oid
ResetDynamicMemory
()
{
total_dynamic_size_
=
0
;
dynamic_mem_offset_
=
0
;
}
...
...
mindspore/ccsrc/pre_activate/mem_reuse/mem_dynamic_allocator.cc
浏览文件 @
1d078329
...
...
@@ -184,14 +184,16 @@ DynamicMemBlockPtr DynamicMemPoolBestFit::FindMemBlock(const DeviceMemPtr device
if
(
iter
!=
global_mem_block_list_
.
begin
())
{
return
*
(
--
iter
);
}
MS_LOG
(
ERROR
)
<<
"Can't find the mem_block of the device address["
<<
device_addr
<<
"]."
;
return
nullptr
;
}
void
DynamicMemPoolBestFit
::
FreeTensorMem
(
const
DeviceMemPtr
device_addr
)
{
MS_EXCEPTION_IF_NULL
(
device_addr
);
auto
mem_block
=
FindMemBlock
(
device_addr
);
MS_EXCEPTION_IF_NULL
(
mem_block
);
if
(
mem_block
==
nullptr
)
{
MS_LOG
(
WARNING
)
<<
"Can't find the mem_block of the device address["
<<
device_addr
<<
"]."
;
return
;
}
CombineMemBuf
(
mem_block
,
device_addr
);
}
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录