From c3332711e91afe0f0d497efef17e4c3f6865755f Mon Sep 17 00:00:00 2001 From: Antonin RAFFIN Date: Thu, 28 Mar 2019 14:09:38 +0100 Subject: [PATCH] Release 2.5.0 (#251) * Remove GAIL results * Begin GAIL cleanup * Fixes for GAIL + add tests * Fix GAIL saving/loading * Add notes * Bug fixes + update changelog for GAIL * Remove unused file * Fix A2C with continuous actions + update logging * Fix ACKTR runner * Fixed behavior cloning + add test * Add pretrain method * Update coverage rc * Rename dataset file * Refactor expert dataset generation * Clean up code for codacy * Remove unused import * Fix close method for DummyVecEnv * Add support for pretraining with discrete actions * Style fix * Kill env processes to avoid memory error during tests * Call close instead of killing processes * Start rewriting expert dataset In order to support image dataset * Style fixes * Add image dataset recorder * Add documentation for pretraining + GAIL * Remove pretrain with image buggy test for now * Fix forkserver hanging when using atari env * Reduce number of cpu for atari envs * Change default start method (test CI) * Test sequential mode * Add sequential processing param * Switch back to fork start method + add warning * Add discrete actions support for GAIL + fix deprecations * Update documentation * Clean up + format code * Replace num_iters by n_epochs + update doc * Do not display NaN reward when not using Monitor (for SAC) * Document Gumbel-max trick * Simplify dataloader * Expert model can be a callable * Release 2.5.0 + New Maintainer --- README.md | 4 ++-- docs/index.rst | 2 +- docs/misc/changelog.rst | 12 +++++++----- setup.py | 5 ++++- stable_baselines/__init__.py | 2 +- 5 files changed, 15 insertions(+), 10 deletions(-) diff --git a/README.md b/README.md index 092704cfc9..0f2d3307ae 100644 --- a/README.md +++ b/README.md @@ -191,7 +191,7 @@ To cite this repository in publications: ``` @misc{stable-baselines, - author = {Hill, Ashley and Raffin, Antonin and Ernestus, 
Maximilian and Traore, Rene and Dhariwal, Prafulla and Hesse, Christopher and Klimov, Oleg and Nichol, Alex and Plappert, Matthias and Radford, Alec and Schulman, John and Sidor, Szymon and Wu, Yuhuai}, + author = {Hill, Ashley and Raffin, Antonin and Ernestus, Maximilian and Gleave, Adam and Traore, Rene and Dhariwal, Prafulla and Hesse, Christopher and Klimov, Oleg and Nichol, Alex and Plappert, Matthias and Radford, Alec and Schulman, John and Sidor, Szymon and Wu, Yuhuai}, title = {Stable Baselines}, year = {2018}, publisher = {GitHub}, @@ -202,7 +202,7 @@ To cite this repository in publications: ## Maintainers -Stable-Baselines is currently maintained by [Ashley Hill](https://github.com/hill-a) (aka @hill-a), [Antonin Raffin](https://araffin.github.io/) (aka [@araffin](https://github.com/araffin)) and [Maximilian Ernestus](https://github.com/erniejunior) (aka @erniejunior). +Stable-Baselines is currently maintained by [Ashley Hill](https://github.com/hill-a) (aka @hill-a), [Antonin Raffin](https://araffin.github.io/) (aka [@araffin](https://github.com/araffin)), [Maximilian Ernestus](https://github.com/erniejunior) (aka @erniejunior) and [Adam Gleave](https://github.com/adamgleave) (aka @AdamGleave). ## How To Contribute diff --git a/docs/index.rst b/docs/index.rst index 733ca1c92e..661cffd3b7 100644 --- a/docs/index.rst +++ b/docs/index.rst @@ -92,7 +92,7 @@ To cite this project in publications: .. 
code-block:: bibtex @misc{stable-baselines, - author = {Hill, Ashley and Raffin, Antonin and Ernestus, Maximilian and Traore, Rene and Dhariwal, Prafulla and Hesse, Christopher and Klimov, Oleg and Nichol, Alex and Plappert, Matthias and Radford, Alec and Schulman, John and Sidor, Szymon and Wu, Yuhuai}, + author = {Hill, Ashley and Raffin, Antonin and Ernestus, Maximilian and Gleave, Adam and Traore, Rene and Dhariwal, Prafulla and Hesse, Christopher and Klimov, Oleg and Nichol, Alex and Plappert, Matthias and Radford, Alec and Schulman, John and Sidor, Szymon and Wu, Yuhuai}, title = {Stable Baselines}, year = {2018}, publisher = {GitHub}, diff --git a/docs/misc/changelog.rst b/docs/misc/changelog.rst index 1ccf49ca8e..df5be3823a 100644 --- a/docs/misc/changelog.rst +++ b/docs/misc/changelog.rst @@ -5,10 +5,10 @@ Changelog For download links, please look at `Github release page <https://github.com/hill-a/stable-baselines/releases>`_. -Pre-Release 2.5.0a0 (WIP) +Release 2.5.0 (2019-03-28) -------------------------- -**Working GAIL and hotfix for A2C with continuous actions** +**Working GAIL, pretrain RL models and hotfix for A2C with continuous actions** - fixed various bugs in GAIL - added scripts to generate dataset for gail @@ -244,18 +244,20 @@ Release 0.1.6 (2018-07-27) - Added atari tests - Added logger tests -Missing: tests for acktr continuous (+ HER, gail but they rely on -mujoco...) +Missing: tests for acktr continuous (+ HER, which relies on mujoco...) Maintainers ----------- -Stable-Baselines is currently maintained by `Ashley Hill`_ (aka @hill-a) `Antonin Raffin`_ (aka `@araffin`_) and `Maximilian Ernestus`_ (aka @erniejunior). +Stable-Baselines is currently maintained by `Ashley Hill`_ (aka @hill-a), `Antonin Raffin`_ (aka `@araffin`_), +`Maximilian Ernestus`_ (aka @erniejunior) and `Adam Gleave`_ (aka `@AdamGleave`_). .. _Ashley Hill: https://github.com/hill-a .. _Antonin Raffin: https://araffin.github.io/ .. _Maximilian Ernestus: https://github.com/erniejunior +.. _Adam Gleave: https://gleave.me/ .. 
_@araffin: https://github.com/araffin +.. _@AdamGleave: https://github.com/adamgleave Contributors (since v2.0.0): ---------------------------- diff --git a/setup.py b/setup.py index 9452aaaa11..475b0662d1 100644 --- a/setup.py +++ b/setup.py @@ -62,6 +62,9 @@ Documentation: https://stable-baselines.readthedocs.io/en/master/ +RL Baselines Zoo: +https://github.com/araffin/rl-baselines-zoo + ## Quick example Most of the library tries to follow a sklearn-like syntax for the Reinforcement Learning algorithms using Gym. @@ -138,7 +141,7 @@ license="MIT", long_description=long_description, long_description_content_type='text/markdown', - version="2.5.0a0", + version="2.5.0", ) # python setup.py sdist diff --git a/stable_baselines/__init__.py b/stable_baselines/__init__.py index b0673863e0..7f885648d0 100644 --- a/stable_baselines/__init__.py +++ b/stable_baselines/__init__.py @@ -9,4 +9,4 @@ from stable_baselines.trpo_mpi import TRPO from stable_baselines.sac import SAC -__version__ = "2.5.0a0" +__version__ = "2.5.0"