diff --git a/python/paddle/jit/translated_layer.py b/python/paddle/jit/translated_layer.py index daea9238733c54ee4489fae546e4a83e42359a50..a5f31c9bea3eea1b1701e01a0d5fcd0065c7218d 100644 --- a/python/paddle/jit/translated_layer.py +++ b/python/paddle/jit/translated_layer.py @@ -338,6 +338,7 @@ class _ProgramHolder: self._output_descs = [] self._double_grad_descs = [] self._persistable_names = [] + self._grad_var_names = {} # execution scope self._inner_scope = core.Scope() @@ -350,7 +351,6 @@ class _ProgramHolder: self._train_program_desc = self._append_backward_desc( self._infer_program_desc ) - self._grad_var_names = {} # forward: @switch_to_static_graph