diff --git a/python/paddle/distributed/fleet/meta_optimizers/sharding_optimizer.py b/python/paddle/distributed/fleet/meta_optimizers/sharding_optimizer.py index 25f9928c826a901a2f014ce1a0b78f21655d8b7d..88ad5cbfdc32cc3c218bf7a18e164239fab4a4fd 100755 --- a/python/paddle/distributed/fleet/meta_optimizers/sharding_optimizer.py +++ b/python/paddle/distributed/fleet/meta_optimizers/sharding_optimizer.py @@ -755,9 +755,6 @@ class ShardingOptimizer(MetaOptimizerBase): sync=False, ) - if core.is_compiled_with_custom_device('npu'): - return - # GPU for pair in self.pipeline_pair: pair_key = pair[0] * 1000 + pair[1]