Skip to content

Commit c6d3b0e

Browse files
authored
Merge branch 'master' into fix/car-racing-v3
2 parents 6ee50f8 + ad1ae18 commit c6d3b0e

File tree

19 files changed

+76
-35
lines changed

19 files changed

+76
-35
lines changed

.github/workflows/ci.yml

Lines changed: 1 addition & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -53,6 +53,7 @@ jobs:
5353
run: |
5454
uv pip install --system gymnasium==${{ matrix.gymnasium-version }}
5555
uv pip install --system "numpy<2"
56+
uv pip install --system "ale-py==0.10.1"
5657
# Only run for Python 3.10, downgrade gymnasium to 0.29.1
5758
if: matrix.gymnasium-version != '1.0.0'
5859

.github/workflows/trained_agents.yml

Lines changed: 1 addition & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -49,14 +49,12 @@ jobs:
4949
# Use headless version
5050
uv pip install --system opencv-python-headless
5151
uv pip install --system -e .[plots,tests]
52-
# Downgrade numpy to run pybullet agents
53-
# See https://github.com/bulletphysics/bullet3/issues/4649
54-
uv pip install --system "numpy<2"
5552
5653
- name: Install specific version of gym
5754
run: |
5855
uv pip install --system gymnasium==${{ matrix.gymnasium-version }}
5956
uv pip install --system "numpy<2"
57+
uv pip install --system "ale-py==0.10.1"
6058
# Only run for Python 3.10, downgrade gymnasium to 0.29.1
6159
if: matrix.gymnasium-version != '1.0.0'
6260

CHANGELOG.md

Lines changed: 17 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -1,3 +1,20 @@
1+
## Release 2.6.1 (WIP)
2+
3+
### Breaking Changes
4+
- Upgraded to SB3 >= 2.6.1
5+
- `linear_schedule` now returns a `SimpleLinearSchedule` object for better portability
6+
- Renamed `LunarLander-v2` to `LunarLander-v3` in hyperparameters
7+
8+
### New Features
9+
10+
### Bug fixes
11+
- Docker GPU images are now working again
12+
- Use `ConstantSchedule` and `SimpleLinearSchedule` instead of `constant_fn` and `linear_schedule`
13+
14+
### Documentation
15+
16+
### Other
17+
118
## Release 2.6.0 (2025-03-24)
219

320
### Breaking Changes

docker/Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
ARG PARENT_IMAGE
1+
ARG PARENT_IMAGE=stablebaselines/stable-baselines3
22
FROM $PARENT_IMAGE
33

44
USER root

hyperparams/a2c.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,7 @@ CartPole-v1:
1919
policy: 'MlpPolicy'
2020
ent_coef: 0.0
2121

22-
LunarLander-v2:
22+
LunarLander-v3:
2323
n_envs: 8
2424
n_timesteps: !!float 2e5
2525
policy: 'MlpPolicy'

hyperparams/ars.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -19,7 +19,7 @@ Pendulum-v1: &pendulum-params
1919
zero_policy: False
2020

2121
# TO BE Tuned
22-
LunarLander-v2:
22+
LunarLander-v3:
2323
<<: *pendulum-params
2424
n_delta: 6
2525
n_top: 1

hyperparams/dqn.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -50,7 +50,7 @@ MountainCar-v0:
5050
policy_kwargs: "dict(net_arch=[256, 256])"
5151

5252
# Tuned
53-
LunarLander-v2:
53+
LunarLander-v3:
5454
n_timesteps: !!float 1e5
5555
policy: 'MlpPolicy'
5656
learning_rate: !!float 6.3e-4

hyperparams/ppo.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -111,7 +111,7 @@ BipedalWalkerHardcore-v3:
111111
learning_rate: lin_2.5e-4
112112
clip_range: lin_0.2
113113

114-
LunarLander-v2:
114+
LunarLander-v3:
115115
n_envs: 16
116116
n_timesteps: !!float 1e6
117117
policy: 'MlpPolicy'

hyperparams/qrdqn.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -43,7 +43,7 @@ MountainCar-v0:
4343
policy_kwargs: "dict(net_arch=[256, 256], n_quantiles=25)"
4444

4545
# Tuned
46-
LunarLander-v2:
46+
LunarLander-v3:
4747
n_timesteps: !!float 1e5
4848
policy: 'MlpPolicy'
4949
learning_rate: lin_1.5e-3

hyperparams/trpo.yml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -23,7 +23,7 @@ Pendulum-v1:
2323
sde_sample_freq: 4
2424

2525
# Tuned
26-
LunarLander-v2:
26+
LunarLander-v3:
2727
n_envs: 2
2828
n_timesteps: !!float 2e5
2929
policy: 'MlpPolicy'

0 commit comments

Comments
 (0)