66import optax
77from chex import Array
88from flax import linen as nn
9- from tqdm import tqdm
109
1110from reinforced_lib import RLib
1211from reinforced_lib .agents .deep import PPODiscrete
@@ -48,14 +47,14 @@ def __call__(self, x: Array) -> tuple[Array, Array]:
4847 return logits , values
4948
5049
51- def run (num_steps : int , num_envs : int , seed : int ) -> None :
50+ def run (time_limit : float , num_envs : int , seed : int ) -> None :
5251 """
5352 Run cart-pole Gymnasium steps until ``time_limit`` seconds elapse.
5453
5554 Parameters
5655 ----------
57- num_steps : int
58- Number of simulation steps to perform .
56+ time_limit : float
57+ Maximum time (in seconds) to run the experiment .
5958 num_envs : int
6059 Number of parallel environments to use.
6160 seed : int
@@ -96,15 +95,12 @@ def make_env():
9695 return_0 , step = 0 , 0
9796 start_time = time .perf_counter ()
9897
99- pbar = tqdm (total = num_steps )
100-
101- while step < num_steps :
98+ while time .perf_counter () - start_time < time_limit :
10299 env_states = env .step (np .asarray (actions ))
103100 actions = rl .sample (* env_states )
104101
105102 return_0 += env_states [1 ][0 ]
106103 step += num_envs
107- pbar .update (num_envs )
108104
109105 if env_states [2 ][0 ] or env_states [3 ][0 ]:
110106 rl .log ('return' , return_0 )
@@ -116,7 +112,7 @@ def make_env():
116112if __name__ == '__main__' :
117113 args = ArgumentParser ()
118114
119- args .add_argument ('--num_steps ' , default = int ( 1e7 ) , type = int )
115+ args .add_argument ('--time_limit ' , default = 120 , type = float )
120116 args .add_argument ('--num_envs' , default = 64 , type = int )
121117 args .add_argument ('--seed' , default = 42 , type = int )
122118
0 commit comments