We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 4436f89, commit eb5c00e (Copy full SHA for eb5c00e)
1 file changed
docs/tutorials/training_agents/action_masking_taxi.py
@@ -170,7 +170,7 @@ def train_q_learning(
170
print(f"Run {i + 1}/{n_runs} with seed {seed}")
171
172
# Train agent WITH action masking
173
- env_masked = gym.make("Taxi-v3")
+ env_masked = gym.make("Taxi-v4")
174
masked_results = train_q_learning(
175
env_masked,
176
use_action_mask=True,
@@ -184,7 +184,7 @@ def train_q_learning(
184
masked_results_list.append(masked_results)
185
186
# Train agent WITHOUT action masking
187
- env_unmasked = gym.make("Taxi-v3")
+ env_unmasked = gym.make("Taxi-v4")
188
unmasked_results = train_q_learning(
189
env_unmasked,
190
use_action_mask=False,
0 commit comments