Skip to content

Commit 99fb972

Browse files
revert
1 parent 5549e95 commit 99fb972

File tree

2 files changed

+3
-2
lines changed

2 files changed

+3
-2
lines changed

pufferlib/environments/metta/environment.py

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -71,4 +71,5 @@ def __init__(self, env_cfg, render_mode='human', buf=None, seed=0):
71 71   env_cfg=env_cfg,
72 72   render_mode=render_mode,
73 73   replay_writer=self.replay_writer,
   74 + is_training=True, # Enable training mode for desync_episodes
74 75   )

pufferlib/pufferl.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -279,8 +279,8 @@ def evaluate(self):
279 279   logits, value = self.policy.forward_eval(o_device, state)
280 280   action, logprob, _ = pufferlib.pytorch.sample_logits(logits)
281 281   # Skip reward clipping for Metta environments to preserve multi-agent reward signals
282     - if not self._is_metta_env():
283     - r = torch.clamp(r, -1, 1)
    282 + # if not self._is_metta_env():
    283 + # r = torch.clamp(r, -1, 1)
284 284
285 285   profile('eval_copy', epoch)
286 286   with torch.no_grad():

0 commit comments

Comments
 (0)