From 309ad8cd69b4db114fc0fb584e9949919cdd5835 Mon Sep 17 00:00:00 2001 From: Antonin RAFFIN Date: Tue, 21 Feb 2023 23:20:57 +0100 Subject: [PATCH] [ci skip] Tune RecurrentPPO Swimmer-v3 (#360) --- CHANGELOG.md | 1 + hyperparams/ppo_lstm.yml | 6 +++++- 2 files changed, 6 insertions(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index e0c3eca94..cb0cc12a8 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -4,6 +4,7 @@ - Upgraded to SB3 >= 1.8.0 ### New Features +- Tuned hyperparameters for RecurrentPPO on Swimmer ### Bug fixes - Set ``highway-env`` version to 1.5 and ``setuptools to`` v65.5 for the CI diff --git a/hyperparams/ppo_lstm.yml b/hyperparams/ppo_lstm.yml index ebd84f4a1..b29087e10 100644 --- a/hyperparams/ppo_lstm.yml +++ b/hyperparams/ppo_lstm.yml @@ -339,7 +339,11 @@ Ant-v3: &mujoco-defaults Swimmer-v3: <<: *mujoco-defaults gamma: 0.9999 - + n_envs: 4 + n_steps: 1024 + batch_size: 256 + learning_rate: !!float 6e-4 + gae_lambda: 0.98 # 10 mujoco envs