Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion README.md
Original file line number Diff line number Diff line change
@@ -1,6 +1,6 @@
<img src="docs/_static/img/logo.png" align="right" width="40%"/>

[![CI](https://github.com/Stable-Baselines-Team/stable-baselines3-contrib/workflows/CI/badge.svg)](https://github.com/Stable-Baselines-Team/stable-baselines3-contrib/actions) [![codestyle](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)
[![CI](https://github.com/Stable-Baselines-Team/stable-baselines3-contrib/actions/workflows/ci.yml/badge.svg)](https://github.com/Stable-Baselines-Team/stable-baselines3-contrib/actions/workflows/ci.yml) [![codestyle](https://img.shields.io/badge/code%20style-black-000000.svg)](https://github.com/psf/black)

# Stable-Baselines3 - Contrib (SB3-Contrib)

Expand Down
2 changes: 1 addition & 1 deletion sb3_contrib/common/envs/invalid_actions_env.py
Original file line number Diff line number Diff line change
Expand Up @@ -20,7 +20,7 @@ def __init__(
dim = 1
assert n_invalid_actions < dim, f"Too many invalid actions: {n_invalid_actions} < {dim}"

space = spaces.Discrete(dim)
space = spaces.Discrete(dim) # type: ignore[var-annotated]
self.n_invalid_actions = n_invalid_actions
self.possible_actions = np.arange(space.n, dtype=int)
self.invalid_actions: list[int] = []
Expand Down
6 changes: 3 additions & 3 deletions tests/wrappers/test_action_masker.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,7 +6,7 @@


class IdentityEnvDiscrete(IdentityEnv):
def __init__(self, dim: int = 1, ep_length: int = 100):
def __init__(self, dim=1, ep_length=100):
"""
Identity environment for testing purposes
Expand All @@ -17,12 +17,12 @@ def __init__(self, dim: int = 1, ep_length: int = 100):
self.useless_property = 1
super().__init__(ep_length=ep_length, space=space)

def _action_masks(self) -> list[int]:
def _action_masks(self): # -> list[bool]
assert isinstance(self.action_space, spaces.Discrete)
return [i == self.state for i in range(self.action_space.n)]


def action_mask_fn(env: IdentityEnvDiscrete) -> list[int]:
def action_mask_fn(env): # -> list[int]
assert isinstance(env.action_space, spaces.Discrete)
return [i == env.state for i in range(env.action_space.n)]

Expand Down