提交 06a9eeb3 编写于 作者: M mindspore-ci-bot 提交者: Gitee

!1050 [bug][auto_mixed_precision]fix sens shape error of `TrainOneStepWithLossScaleCell`

Merge pull request !1050 from vlne-v1/I1GEPN-check-bprop-error-loss-scale-wrap
......@@ -249,7 +249,9 @@ class TrainOneStepWithLossScaleCell(Cell):
scaling_sens = self.loss_scale
else:
scaling_sens = sens
grads = self.grad(self.network, weights)(data, label, F.cast(scaling_sens, F.dtype(loss)))
scaling_sens_filled = C.ones_like(loss) * F.cast(scaling_sens, F.dtype(loss))
grads = self.grad(self.network, weights)(data, label, scaling_sens_filled)
grads = self.hyper_map(F.partial(_grad_scale, scaling_sens), grads)
# apply grad reducer on grads
grads = self.grad_reducer(grads)
......
......@@ -154,7 +154,8 @@ def build_train_network(network, optimizer, loss_fn=None, level='O0', **kwargs):
loss_scale = loss_scale_manager.get_loss_scale()
update_cell = loss_scale_manager.get_update_cell()
if update_cell is not None:
if not (context.get_context("enable_ge") or (context.get_context("device_target") == "GPU")):
# only cpu not support `TrainOneStepWithLossScaleCell` for control flow.
if not context.get_context("enable_ge") and context.get_context("device_target") == "CPU":
raise ValueError("Only `loss_scale_manager=None` and "
"`loss_scale_manager=FixedLossScaleManager(drop_overflow_update=False)`"
"are supported in current version. If you use `O2` option, please"
......
......@@ -93,7 +93,8 @@ def loss_scale_manager_common(strategy1):
assert False
def test_dataset_interface_sens_scalar():
def fixme_test_dataset_interface_sens_scalar():
# With error: "The type of sens node is not Tensor or Parameter, it is unsupported now."
strategy1 = ((8, 1), )
loss_scale_manager_common(strategy1)
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册