Downgrade sphinx-autodoc-typehints (#1291)

qgallouedec · web-flow · commit 69fdf155e107 · 2023-01-23T10:56:45.000+01:00
* Update setup.py

* Apply black formatting

* Hotfix pytype errors (suppress signature-mismatch in buffers.py)
diff --git a/setup.py b/setup.py
@@ -117,7 +117,7 @@
             # For spelling
             "sphinxcontrib.spelling",
             # Type hints support
-            "sphinx-autodoc-typehints",
+            "sphinx-autodoc-typehints==1.21.1",  # TODO: remove version constraint, see #1290
             # Copy button for code snippets
             "sphinx_copybutton",
         ],
diff --git a/stable_baselines3/common/buffers.py b/stable_baselines3/common/buffers.py
@@ -474,7 +474,7 @@ def get(self, batch_size: Optional[int] = None) -> Generator[RolloutBufferSample
             yield self._get_samples(indices[start_idx : start_idx + batch_size])
             start_idx += batch_size
 
-    def _get_samples(self, batch_inds: np.ndarray, env: Optional[VecNormalize] = None) -> RolloutBufferSamples:
+    def _get_samples(self, batch_inds: np.ndarray, env: Optional[VecNormalize] = None) -> RolloutBufferSamples:  # type: ignore[signature-mismatch] #FIXME
         data = (
             self.observations[batch_inds],
             self.actions[batch_inds],
@@ -603,7 +603,7 @@ def add(
             self.full = True
             self.pos = 0
 
-    def sample(self, batch_size: int, env: Optional[VecNormalize] = None) -> DictReplayBufferSamples:
+    def sample(self, batch_size: int, env: Optional[VecNormalize] = None) -> DictReplayBufferSamples:  # type: ignore[signature-mismatch] #FIXME:
         """
         Sample elements from the replay buffer.
 
@@ -614,7 +614,7 @@ def sample(self, batch_size: int, env: Optional[VecNormalize] = None) -> DictRep
         """
         return super(ReplayBuffer, self).sample(batch_size=batch_size, env=env)
 
-    def _get_samples(self, batch_inds: np.ndarray, env: Optional[VecNormalize] = None) -> DictReplayBufferSamples:
+    def _get_samples(self, batch_inds: np.ndarray, env: Optional[VecNormalize] = None) -> DictReplayBufferSamples:  # type: ignore[signature-mismatch] #FIXME:
         # Sample randomly the env idx
         env_indices = np.random.randint(0, high=self.n_envs, size=(len(batch_inds),))
 
@@ -743,7 +743,7 @@ def add(
         if self.pos == self.buffer_size:
             self.full = True
 
-    def get(self, batch_size: Optional[int] = None) -> Generator[DictRolloutBufferSamples, None, None]:
+    def get(self, batch_size: Optional[int] = None) -> Generator[DictRolloutBufferSamples, None, None]:  # type: ignore[signature-mismatch] #FIXME
         assert self.full, ""
         indices = np.random.permutation(self.buffer_size * self.n_envs)
         # Prepare the data
@@ -767,7 +767,7 @@ def get(self, batch_size: Optional[int] = None) -> Generator[DictRolloutBufferSa
             yield self._get_samples(indices[start_idx : start_idx + batch_size])
             start_idx += batch_size
 
-    def _get_samples(self, batch_inds: np.ndarray, env: Optional[VecNormalize] = None) -> DictRolloutBufferSamples:
+    def _get_samples(self, batch_inds: np.ndarray, env: Optional[VecNormalize] = None) -> DictRolloutBufferSamples:  # type: ignore[signature-mismatch] #FIXME
 
         return DictRolloutBufferSamples(
             observations={key: self.to_torch(obs[batch_inds]) for (key, obs) in self.observations.items()},
diff --git a/stable_baselines3/common/envs/identity_env.py b/stable_baselines3/common/envs/identity_env.py
@@ -71,7 +71,7 @@ def __init__(self, low: float = -1.0, high: float = 1.0, eps: float = 0.05, ep_l
         super().__init__(ep_length=ep_length, space=space)
         self.eps = eps
 
-    def step(self, action: np.ndarray) -> GymStepReturn:
+    def step(self, action: np.ndarray) -> Tuple[np.ndarray, float, bool, Dict[str, Any]]:
         reward = self._get_reward(action)
         self._choose_next_state()
         self.current_step += 1
@@ -83,7 +83,7 @@ def _get_reward(self, action: np.ndarray) -> float:
 
 
 class IdentityEnvMultiDiscrete(IdentityEnv[np.ndarray]):
-    def __init__(self, dim: int = 1, ep_length: int = 100):
+    def __init__(self, dim: int = 1, ep_length: int = 100) -> None:
         """
         Identity environment for testing purposes
 
@@ -95,7 +95,7 @@ def __init__(self, dim: int = 1, ep_length: int = 100):
 
 
 class IdentityEnvMultiBinary(IdentityEnv[np.ndarray]):
-    def __init__(self, dim: int = 1, ep_length: int = 100):
+    def __init__(self, dim: int = 1, ep_length: int = 100) -> None:
         """
         Identity environment for testing purposes
 
@@ -126,7 +126,7 @@ def __init__(
         n_channels: int = 1,
         discrete: bool = True,
         channel_first: bool = False,
-    ):
+    ) -> None:
         self.observation_shape = (screen_height, screen_width, n_channels)
         if channel_first:
             self.observation_shape = (n_channels, screen_height, screen_width)