* Remove old comment

jingweiz · Aug 21, 2017 · 907107b
1 parent c6e4edc
commit 907107b
Showing 1 changed file with 0 additions and 1 deletion.
diff --git a/core/agents/acer_single_process.py b/core/agents/acer_single_process.py
@@ -263,7 +263,6 @@ def _backward(self, on_policy=True):
             # NOTE: here we can backprop both losses at once, but to make consistent
             # NOTE: and avoid the need to keep track of another set of undetached policy loss
             # NOTE: we also decouple the backprop of the policy loss into two stages
-            # 1.2 backprop from the network output to the whole model
             backward(variables=self.rollout.policy_vb, grad_variables=policy_grad_vb, retain_graph=True)
         # 2. backprop the value loss and entropy loss
         (value_loss_vb + self.master.beta * entropy_loss_vb).backward()