Skip to content

Commit

Permalink
Update
Browse files Browse the repository at this point in the history
[ghstack-poisoned]
  • Loading branch information
vmoens committed Dec 15, 2024
1 parent 6fe27a8 commit 99db504
Show file tree
Hide file tree
Showing 2 changed files with 2 additions and 2 deletions.
2 changes: 1 addition & 1 deletion sota-implementations/ppo/ppo_mujoco.py
Original file line number Diff line number Diff line change
Expand Up @@ -192,7 +192,7 @@ def update(batch, num_network_updates):
# extract cfg variables
cfg_loss_ppo_epochs = cfg.loss.ppo_epochs
cfg_optim_anneal_lr = cfg.optim.anneal_lr
- cfg_optim_lr = cfg.optim.lr
+ cfg_optim_lr = torch.tensor(cfg.optim.lr, device=device)
cfg_loss_anneal_clip_eps = cfg.loss.anneal_clip_epsilon
cfg_loss_clip_epsilon = cfg.loss.clip_epsilon
cfg_logger_test_interval = cfg.logger.test_interval
Expand Down
2 changes: 1 addition & 1 deletion sota-implementations/ppo/utils_mujoco.py
Original file line number Diff line number Diff line change
Expand Up @@ -77,7 +77,7 @@ def make_ppo_models_state(proof_environment, device):
policy_mlp,
AddStateIndependentNormalScale(
proof_environment.action_spec_unbatched.shape[-1], scale_lb=1e-8
- ),
+ ).to(device),
)

# Add probabilistic sampling of the actions
Expand Down

0 comments on commit 99db504

Please sign in to comment.