提交 4dc50007 编写于 作者: W wuzewu

Fixed the issue that the model does not support training in multi-card scene.

上级 595f4534
...@@ -18,8 +18,8 @@ import time ...@@ -18,8 +18,8 @@ import time
from collections import defaultdict from collections import defaultdict
from typing import Any, Callable, Generic, List from typing import Any, Callable, Generic, List
import numpy as np
import paddle import paddle
import numpy as np
from visualdl import LogWriter from visualdl import LogWriter
from paddlehub.utils.log import logger from paddlehub.utils.log import logger
...@@ -82,6 +82,7 @@ class Trainer(object): ...@@ -82,6 +82,7 @@ class Trainer(object):
if self.nranks > 1: if self.nranks > 1:
paddle.distributed.init_parallel_env() paddle.distributed.init_parallel_env()
self.model = paddle.DataParallel(self.model) self.model = paddle.DataParallel(self.model)
self.compare_metrics = self._compare_metrics if not compare_metrics else compare_metrics self.compare_metrics = self._compare_metrics if not compare_metrics else compare_metrics
self._load_checkpoint() self._load_checkpoint()
...@@ -178,8 +179,14 @@ class Trainer(object): ...@@ -178,8 +179,14 @@ class Trainer(object):
collate_fn(callable): function to generate mini-batch data by merging the sample list. collate_fn(callable): function to generate mini-batch data by merging the sample list.
None for only stack each fields of sample in axis 0(same as :attr::`np.stack(..., axis=0)`). Default None None for only stack each fields of sample in axis 0(same as :attr::`np.stack(..., axis=0)`). Default None
''' '''
if eval_dataset is not None and not hasattr(self.model, 'validation_step'): if eval_dataset is not None:
raise NotImplementedError('The specified finetuning model does not support evaluation.') if isinstance(self.model, paddle.DataParallel):
model = self.model._layers
else:
model = self.model
if not hasattr(model, 'validation_step'):
raise NotImplementedError('The specified finetuning model does not support evaluation.')
batch_sampler = paddle.io.DistributedBatchSampler( batch_sampler = paddle.io.DistributedBatchSampler(
train_dataset, batch_size=batch_size, shuffle=True, drop_last=False) train_dataset, batch_size=batch_size, shuffle=True, drop_last=False)
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册