Patch summary (large_scale_sparse_pass): drop the stale commented-out
`block._remove_op(opt_idx)` lines that preceded the fused-optimizer insertions,
and look up Beta1PowOut / Beta2PowOut through op.output() instead of op.input().

diff --git a/python/paddle/fluid/incubate/fleet/parameter_server/ir/pserver_pass.py b/python/paddle/fluid/incubate/fleet/parameter_server/ir/pserver_pass.py
index 28cb850b6138273dfb7b53aa3e6b410935e4d625..20f8aa3bb100da5fa622a4578997420250a63e70 100644
--- a/python/paddle/fluid/incubate/fleet/parameter_server/ir/pserver_pass.py
+++ b/python/paddle/fluid/incubate/fleet/parameter_server/ir/pserver_pass.py
@@ -658,8 +658,6 @@ def large_scale_sparse_pass(program, main_program, config, is_startup=False):
         if op.type == "sgd":
             grad = main_program.global_block().vars[op.input("Grad")[0]]
             lr = main_program.global_block().vars[op.input("LearningRate")[0]]
-            ## remove origin optimzier op
-            #block._remove_op(opt_idx)
 
             block._insert_op(
                 opt_idx,
@@ -679,18 +677,15 @@ def large_scale_sparse_pass(program, main_program, config, is_startup=False):
                 0]]
             beta2_pow = main_program.global_block().vars[op.input("Beta2Pow")[
                 0]]
-            beta1_pow_o = main_program.global_block().vars[op.input(
+            beta1_pow_o = main_program.global_block().vars[op.output(
                 "Beta1PowOut")[0]]
-            beta2_pow_o = main_program.global_block().vars[op.input(
+            beta2_pow_o = main_program.global_block().vars[op.output(
                 "Beta2PowOut")[0]]
 
             beta1 = op.attr('beta1')
             beta2 = op.attr('beta2')
             epsilon = op.attr('epsilon')
 
-            ## remove origin optimzier op
-            #block._remove_op(opt_idx)
-
             block._insert_op(
                 opt_idx,
                 type="lookup_sparse_table_fuse_adam",