diff --git a/CHANGELOG.md b/CHANGELOG.md index 8a472ec..cef7da2 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,4 +1,4 @@ -## Release 0.8.0a6 (WIP) +## Release 0.8.0 (2020-08-04) ### Breaking Changes @@ -10,6 +10,7 @@ - Added saving of command line args (@SammyRamone) - Added DDPG support - Added version +- Added ``RMSpropTFLike`` support ### Bug fixes - Fixed optuna warning (@SammyRamone) diff --git a/hyperparams/a2c.yml b/hyperparams/a2c.yml index 6f131ec..63fb97f 100644 --- a/hyperparams/a2c.yml +++ b/hyperparams/a2c.yml @@ -7,6 +7,7 @@ atari: n_timesteps: !!float 1e7 ent_coef: 0.01 vf_coef: 0.25 + policy_kwargs: "dict(optimizer_class=RMSpropTFLike)" CartPole-v1: n_envs: 8 diff --git a/requirements.txt b/requirements.txt index 4b85133..b0e5552 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,4 +1,4 @@ -stable-baselines3[extra,tests,docs]>=0.8.0a1 +stable-baselines3[extra,tests,docs]>=0.8.0 box2d-py==2.3.5 pybullet gym-minigrid diff --git a/train.py b/train.py index b2df452..79eec74 100644 --- a/train.py +++ b/train.py @@ -19,6 +19,7 @@ from stable_baselines3.common.callbacks import CheckpointCallback, EvalCallback from stable_baselines3.common.noise import NormalActionNoise, OrnsteinUhlenbeckActionNoise from stable_baselines3.common.preprocessing import is_image_space +from stable_baselines3.common.sb2_compat.rmsprop_tf_like import RMSpropTFLike # noqa: F401 from stable_baselines3.common.utils import constant_fn, set_random_seed # from stable_baselines3.common.cmd_util import make_atari_env diff --git a/version.txt b/version.txt index db50579..a3df0a6 100644 --- a/version.txt +++ b/version.txt @@ -1 +1 @@ -0.8.0a6 +0.8.0