fix compatibility issue with the newest paddle (#218)

* fix compatibility issue with the newest paddle
* remove logging lines

Co-authored-by: N robot <zenghongsheng@baidu.com>

fix compatibility issue with the newest paddle (#218)
* fix compatibility issue with the newest paddle
* remove logging lines

Co-authored-by: N robot <zenghongsheng@baidu.com>
7a16adc0 · Bo Zhou · GitHub · d96dba18 · 7a16adc0 · 7a16adc0
隐藏空白更改
内联并排

Showing 2 changed files with 4 additions and 2 deletions

parl/algorithms/fluid/a3c.py parl/algorithms/fluid/a3c.py +1 -0

parl/algorithms/fluid/maddpg.py parl/algorithms/fluid/maddpg.py +3 -2

未找到文件。
--- a/parl/algorithms/fluid/a3c.py
+++ b/parl/algorithms/fluid/a3c.py
@@ -72,6 +72,7 @@ class A3C(Algorithm):
        policy_entropy = policy_distribution.entropy()
        entropy = layers.reduce_sum(policy_entropy)
+        entropy_coeff = layers.reshape(entropy_coeff, shape=[1])
        total_loss = (
            pi_loss + vf_loss * self.vf_loss_coeff + entropy * entropy_coeff)

--- a/parl/algorithms/fluid/maddpg.py
+++ b/parl/algorithms/fluid/maddpg.py
@@ -27,10 +27,11 @@ from parl.core.fluid.policy_distribution import SoftMultiCategoricalDistribution
 def SoftPDistribution(logits, act_space):
-    """input:
+    """Args:
            logits: the output of policy model
            act_space: action space, must be gym.spaces.Discrete or multiagent.multi_discrete.MultiDiscrete
-        output：
+        Return:
            instance of SoftCategoricalDistribution or SoftMultiCategoricalDistribution
    """
    # is instance of gym.spaces.Discrete