update comment, format

Juan de los Rios · vmoens · commit 4fc9e580eeb6 · 2025-08-01T14:12:32.000+01:00
diff --git a/test/test_cost.py b/test/test_cost.py
@@ -9779,11 +9779,11 @@ def mixture_constructor(logits, loc, scale):
             # keep per-head entropies instead of the aggregated tensor
             set_composite_lp_aggregate(False).set()
             coef_map = {
-                ("agent0", "action", "action1", "sub_action1_log_prob"):0.02,
-                ("agent0", "action", "action1", "sub_action2_log_prob"):0.01,
-                ("agent0", "action", "action2_log_prob"):0.01,
-                ("agent1", "action_log_prob"):0.01,
-                "agent2_log_prob":0.01,
+                ("agent0", "action", "action1", "sub_action1_log_prob"): 0.02,
+                ("agent0", "action", "action1", "sub_action2_log_prob"): 0.01,
+                ("agent0", "action", "action2_log_prob"): 0.01,
+                ("agent1", "action_log_prob"): 0.01,
+                "agent2_log_prob": 0.01,
             }
             ppo_weighted = cls(policy, value_operator, entropy_coeff=coef_map)
             ppo_weighted.set_keys(
@@ -9872,7 +9872,7 @@ def test_weighted_entropy_scalar(self):
         torch.testing.assert_close(out, torch.tensor(-1.0))
 
     def test_weighted_entropy_mapping(self):
-        coef = {("head_0","action_log_prob"): 0.3, ("head_1","action_log_prob"): 0.7}
+        coef = {("head_0", "action_log_prob"): 0.3, ("head_1", "action_log_prob"): 0.7}
         loss = self._make_entropy_loss(entropy_coeff=coef)
         entropy = TensorDict(
             {
@@ -9882,7 +9882,10 @@ def test_weighted_entropy_mapping(self):
             [],
         )
         out = loss._weighted_loss_entropy(entropy)
-        expected = -(coef[("head_0","action_log_prob")] * 1.0 + coef[("head_1","action_log_prob")] * 2.0)
+        expected = -(
+            coef[("head_0", "action_log_prob")] * 1.0
+            + coef[("head_1", "action_log_prob")] * 2.0
+        )
         torch.testing.assert_close(out, torch.tensor(expected))
 
     def test_weighted_entropy_mapping_missing_key(self):
diff --git a/torchrl/objectives/ppo.py b/torchrl/objectives/ppo.py
@@ -912,6 +912,7 @@ def _weighted_loss_entropy(
 
         If `self._entropy_coeff_map` is provided, apply per-head entropy coefficients.
         Otherwise, use the scalar `self.entropy_coeff`.
+        Each key in `self._entropy_coeff_map` must be the full nested key of its entropy head.
         """
         if self._entropy_coeff_map is None:
             if is_tensor_collection(entropy):