adaptive-intelligent-robotics
diff --git a/‎.github/workflows/ci.yaml‎
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/ci.yaml‎
Lines changed: 1 addition & 1 deletion
diff --git a/‎examples/aurora.ipynb‎
Lines changed: 2 additions & 2 deletions b/‎examples/aurora.ipynb‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎examples/cmaes.ipynb‎
Lines changed: 2 additions & 2 deletions b/‎examples/cmaes.ipynb‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎examples/cmame.ipynb‎
Lines changed: 7 additions & 7 deletions b/‎examples/cmame.ipynb‎
Lines changed: 7 additions & 7 deletions
diff --git a/‎examples/cmamega.ipynb‎
Lines changed: 6 additions & 6 deletions b/‎examples/cmamega.ipynb‎
Lines changed: 6 additions & 6 deletions
diff --git a/‎examples/dads.ipynb‎
Lines changed: 5 additions & 17 deletions b/‎examples/dads.ipynb‎
Lines changed: 5 additions & 17 deletions
diff --git a/‎examples/dcrlme.ipynb‎
Lines changed: 6 additions & 6 deletions b/‎examples/dcrlme.ipynb‎
Lines changed: 6 additions & 6 deletions
diff --git a/‎examples/diayn.ipynb‎
Lines changed: 5 additions & 17 deletions b/‎examples/diayn.ipynb‎
Lines changed: 5 additions & 17 deletions
diff --git a/‎examples/distributed_mapelites.ipynb‎
Lines changed: 2 additions & 2 deletions b/‎examples/distributed_mapelites.ipynb‎
Lines changed: 2 additions & 2 deletions
diff --git a/‎examples/jumanji_snake.ipynb‎
Lines changed: 2 additions & 2 deletions b/‎examples/jumanji_snake.ipynb‎
Lines changed: 2 additions & 2 deletions
@@ -16,7 +16,7 @@ jobs:
       - name: Set up Python
         uses: actions/setup-python@v5
         with:
-          python-version: '3.11'
+          python-version: "3.11"
 
       - name: Install system dependencies
         run: |
 
@@ -79,8 +79,8 @@
     "\n",
     "from qdax.core.aurora import AURORA\n",
     "from qdax.core.containers.unstructured_repertoire import UnstructuredRepertoire\n",
-    "import qdax.tasks.brax.v1 as environments\n",
-    "from qdax.tasks.brax.v1.env_creators import (\n",
+    "import qdax.tasks.brax as environments\n",
+    "from qdax.tasks.brax.env_creators import (\n",
     "    create_default_brax_task_components,\n",
     "    get_aurora_scoring_fn,\n",
     ")\n",
 
@@ -129,12 +129,12 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "def rastrigin_scoring(x: jnp.ndarray):\n",
+    "def rastrigin_scoring(x: jax.Array):\n",
     "    first_term = 10 * x.shape[-1]\n",
     "    second_term = jnp.sum((x + minval * 0.4) ** 2 - 10 * jnp.cos(2 * jnp.pi * (x + minval * 0.4)))\n",
     "    return -(first_term + second_term)\n",
     "\n",
-    "def sphere_scoring(x: jnp.ndarray):\n",
+    "def sphere_scoring(x: jax.Array):\n",
     "    return -jnp.sum((x + minval * 0.4) * (x + minval * 0.4), axis=-1)\n",
     "\n",
     "if optim_problem == \"sphere\":\n",
 
@@ -132,12 +132,12 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "def rastrigin_scoring(x: jnp.ndarray):\n",
+    "def rastrigin_scoring(x: jax.Array):\n",
     "    first_term = 10 * x.shape[-1]\n",
     "    second_term = jnp.sum((x + minval * 0.4) ** 2 - 10 * jnp.cos(2 * jnp.pi * (x + minval * 0.4)))\n",
     "    return -(first_term + second_term)\n",
     "\n",
-    "def sphere_scoring(x: jnp.ndarray):\n",
+    "def sphere_scoring(x: jax.Array):\n",
     "    return -jnp.sum((x + minval * 0.4) * (x + minval * 0.4), axis=-1)\n",
     "\n",
     "if optim_problem == \"sphere\":\n",
@@ -147,21 +147,21 @@
     "else:\n",
     "    raise Exception(\"Invalid opt function name given\")\n",
     "\n",
-    "def clip(x: jnp.ndarray):\n",
+    "def clip(x: jax.Array):\n",
     "    in_bound = (x <= maxval) * (x >= minval)\n",
     "    return jnp.where(\n",
     "        in_bound,\n",
     "        x,\n",
     "        (maxval / x)\n",
     "    )\n",
     "\n",
-    "def _descriptor_1(x: jnp.ndarray):\n",
+    "def _descriptor_1(x: jax.Array):\n",
     "    return jnp.sum(clip(x[:x.shape[-1]//2]))\n",
     "\n",
-    "def _descriptor_2(x: jnp.ndarray):\n",
+    "def _descriptor_2(x: jax.Array):\n",
     "    return jnp.sum(clip(x[x.shape[-1]//2:]))\n",
     "\n",
-    "def _descriptors(x: jnp.ndarray):\n",
+    "def _descriptors(x: jax.Array):\n",
     "    return jnp.array([_descriptor_1(x), _descriptor_2(x)])"
    ]
   },
@@ -198,7 +198,7 @@
     "\n",
     "num_centroids = math.prod(grid_shape)\n",
     "\n",
-    "def metrics_fn(repertoire: MapElitesRepertoire) -> Dict[str, jnp.ndarray]:\n",
+    "def metrics_fn(repertoire: MapElitesRepertoire) -> Dict[str, jax.Array]:\n",
     "\n",
     "    # get metrics\n",
     "    grid_empty = repertoire.fitnesses == -jnp.inf\n",
 
@@ -124,19 +124,19 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "def rastrigin_scoring(x: jnp.ndarray):\n",
+    "def rastrigin_scoring(x: jax.Array):\n",
     "    return -(10 * x.shape[-1] + jnp.sum((x+minval*0.4)**2 - 10 * jnp.cos(2 * jnp.pi * (x+minval*0.4))))\n",
     "\n",
-    "def clip(x: jnp.ndarray):\n",
+    "def clip(x: jax.Array):\n",
     "    return x*(x<=maxval)*(x>=+minval) + maxval/x*((x>maxval)+(x<+minval))\n",
     "\n",
-    "def _rastrigin_descriptor_1(x: jnp.ndarray):\n",
+    "def _rastrigin_descriptor_1(x: jax.Array):\n",
     "    return jnp.mean(clip(x[:x.shape[-1]//2]))\n",
     "\n",
-    "def _rastrigin_descriptor_2(x: jnp.ndarray):\n",
+    "def _rastrigin_descriptor_2(x: jax.Array):\n",
     "    return jnp.mean(clip(x[x.shape[-1]//2:]))\n",
     "\n",
-    "def rastrigin_descriptors(x: jnp.ndarray):\n",
+    "def rastrigin_descriptors(x: jax.Array):\n",
     "    return jnp.array([_rastrigin_descriptor_1(x), _rastrigin_descriptor_2(x)])\n",
     "\n",
     "rastrigin_grad_scores = jax.grad(rastrigin_scoring)"
@@ -191,7 +191,7 @@
     "best_objective = rastrigin_scoring(jnp.ones(num_dimensions) * 5.12 * 0.4)\n",
     "\n",
     "\n",
-    "def metrics_fn(repertoire: MapElitesRepertoire) -> Dict[str, jnp.ndarray]:\n",
+    "def metrics_fn(repertoire: MapElitesRepertoire) -> Dict[str, jax.Array]:\n",
     "\n",
     "    # get metrics\n",
     "    grid_empty = repertoire.fitnesses == -jnp.inf\n",
 
@@ -75,15 +75,14 @@
     "import jax\n",
     "import jax.numpy as jnp\n",
     "\n",
-    "import qdax.tasks.brax.v1 as environments\n",
+    "import qdax.tasks.brax as environments\n",
     "from qdax.baselines.dads import DADS, DadsConfig, DadsTrainingState\n",
     "from qdax.core.neuroevolution.buffers.buffer import QDTransition, ReplayBuffer\n",
     "from qdax.core.neuroevolution.sac_td3_utils import do_iteration_fn, warmstart_buffer\n",
     "\n",
     "from qdax.utils.plotting import plot_skills_trajectory\n",
     "\n",
-    "from IPython.display import HTML\n",
-    "from brax.v1.io import html"
+    "from IPython.display import HTML"
    ]
   },
   {
@@ -94,7 +93,7 @@
     "\n",
     "Most hyperparameters are similar to those introduced in [SAC paper](https://arxiv.org/abs/1801.01290), [DIAYN paper](https://arxiv.org/abs/1802.06070) and [DADS paper](https://arxiv.org/abs/1907.01657).\n",
     "\n",
-    "The parameter `descriptor_full_state` is less straightforward, it concerns the information used for diversity seeking and dynamics. In DADS, one can use the full state for diversity seeking, but one can also use a prior to focus on an interesting aspect of the state. Actually, priors are often used in experiments, for instance, focusing on the x/y position rather than the full position. When `descriptor_full_state` is set to True, it uses the full state, when it is set to False, it uses the 'state descriptor' retrieved by the environment. Hence, it is required that the environment has one. (All the `_uni`, `_omni` do, same for `anttrap`, `antmaze` and `pointmaze`.) In the future, we will add an option to use a prior function directly on the full state."
+    "The parameter `descriptor_full_state` is less straightforward, it concerns the information used for diversity seeking and dynamics. In DADS, one can use the full state for diversity seeking, but one can also use a prior to focus on an interesting aspect of the state. Actually, priors are often used in experiments, for instance, focusing on the x/y position rather than the full position. When `descriptor_full_state` is set to True, it uses the full state, when it is set to False, it uses the 'state descriptor' retrieved by the environment. Hence, it is required that the environment has one. In the future, we will add an option to use a prior function directly on the full state."
    ]
   },
   {
@@ -385,7 +384,7 @@
    "source": [
     "## Plot the trajectories of the skills at the end of the training\n",
     "\n",
-    "This only works when the state descriptor considered is two-dimensional, and as a real interest only when this state descriptor is the x/y position. Hence, on all \"omni\" tasks, on pointmaze, anttrap and antmaze."
+    "This only works when the state descriptor considered is two-dimensional, and is of real interest only when this state descriptor is the x/y position."
    ]
   },
   {
@@ -419,18 +418,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# Visualize the skills in the physical simulation\n",
-    "\n",
-    "WARNING: this does not work with \"pointmaze\""
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "assert env_name != \"pointmaze\", \"No visualisation available for pointmaze at the moment\""
+    "# Visualize the skills in the physical simulation"
    ]
   },
   {
 
@@ -80,17 +80,17 @@
     "import jax\n",
     "import jax.numpy as jnp\n",
     "\n",
-    "import qdax.tasks.brax.v1 as environments\n",
+    "import qdax.tasks.brax as environments\n",
     "from qdax.core.containers.mapelites_repertoire import compute_cvt_centroids\n",
     "from qdax.core.emitters.dcrl_me_emitter import DCRLMEConfig, DCRLMEEmitter\n",
     "from qdax.core.emitters.mutation_operators import isoline_variation\n",
     "from qdax.core.map_elites import MAPElites\n",
     "from qdax.core.neuroevolution.buffers.buffer import DCRLTransition\n",
     "from qdax.core.neuroevolution.networks.networks import MLP, MLPDC\n",
     "from qdax.custom_types import EnvState, Params, RNGKey\n",
-    "from qdax.tasks.brax.v1 import descriptor_extractor\n",
-    "from qdax.tasks.brax.v1.wrappers.reward_wrappers import OffsetRewardWrapper, ClipRewardWrapper\n",
-    "from qdax.tasks.brax.v1.env_creators import scoring_function_brax_envs\n",
+    "from qdax.tasks.brax import descriptor_extractor\n",
+    "from qdax.tasks.brax.wrappers.reward_wrappers import OffsetRewardWrapper, ClipRewardWrapper\n",
+    "from qdax.tasks.brax.env_creators import scoring_function_brax_envs\n",
     "from qdax.utils.plotting import plot_map_elites_results\n",
     "\n",
     "from qdax.utils.metrics import CSVLogger, default_qd_metrics"
@@ -436,7 +436,7 @@
  ],
  "metadata": {
   "kernelspec": {
-   "display_name": "venv",
+   "display_name": ".venv",
    "language": "python",
    "name": "python3"
   },
@@ -450,7 +450,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.10.12"
+   "version": "3.13.9"
   }
  },
  "nbformat": 4,
 
@@ -75,15 +75,14 @@
     "import jax\n",
     "import jax.numpy as jnp\n",
     "\n",
-    "import qdax.tasks.brax.v1 as environments\n",
+    "import qdax.tasks.brax as environments\n",
     "from qdax.baselines.diayn import DIAYN, DiaynConfig, DiaynTrainingState\n",
     "from qdax.core.neuroevolution.buffers.buffer import QDTransition, ReplayBuffer\n",
     "from qdax.core.neuroevolution.sac_td3_utils import do_iteration_fn, warmstart_buffer\n",
     "\n",
     "from qdax.utils.plotting import plot_skills_trajectory\n",
     "\n",
-    "from IPython.display import HTML\n",
-    "from brax.v1.io import html"
+    "from IPython.display import HTML"
    ]
   },
   {
@@ -94,7 +93,7 @@
     "\n",
     "Most hyperparameters are similar to those introduced in [SAC paper](https://arxiv.org/abs/1801.01290) and [DIAYN paper](https://arxiv.org/abs/1802.06070).\n",
     "\n",
-    "The parameter `descriptor_full_state` is less straightforward, it concerns the information used for diversity seeking and discrimination. In DIAYN, one can use the full state for diversity seeking, but one can also use a prior to focus on an interesting aspect of the state. Actually, priors are often used in experiments, for instance, focusing on the x/y position rather than the full position. When `descriptor_full_state` is set to True, it uses the full state, when it is set to False, it uses the 'state descriptor' retrieved by the environment. Hence, it is required that the environment has one. (All the `_uni`, `_omni` do, same for `anttrap`, `antmaze` and `pointmaze`.) In the future, we will add an option to use a prior function directly on the full state."
+    "The parameter `descriptor_full_state` is less straightforward, it concerns the information used for diversity seeking and discrimination. In DIAYN, one can use the full state for diversity seeking, but one can also use a prior to focus on an interesting aspect of the state. Actually, priors are often used in experiments, for instance, focusing on the x/y position rather than the full position. When `descriptor_full_state` is set to True, it uses the full state, when it is set to False, it uses the 'state descriptor' retrieved by the environment. Hence, it is required that the environment has one. In the future, we will add an option to use a prior function directly on the full state."
    ]
   },
   {
@@ -374,7 +373,7 @@
    "source": [
     "## Plot the trajectories of the skills at the end of the training\n",
     "\n",
-    "This only works when the state descriptor considered is two-dimensional, and as a real interest only when this state descriptor is the x/y position. Hence, on all \"omni\" tasks, on pointmaze, anttrap and antmaze."
+    "This only works when the state descriptor considered is two-dimensional, and is of real interest only when this state descriptor is the x/y position."
    ]
   },
   {
@@ -408,18 +407,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# Visualize the skills in the physical simulation\n",
-    "\n",
-    "WARNING: this does not work with \"pointmaze\""
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "assert env_name != \"pointmaze\", \"No visualisation available for pointmaze at the moment\""
+    "# Visualize the skills in the physical simulation"
    ]
   },
   {
 
@@ -81,8 +81,8 @@
     "\n",
     "from qdax.core.distributed_map_elites import DistributedMAPElites\n",
     "from qdax.core.containers.mapelites_repertoire import compute_cvt_centroids\n",
-    "import qdax.tasks.brax.v1 as environments\n",
-    "from qdax.tasks.brax.v1.env_creators import scoring_function_brax_envs as scoring_function\n",
+    "import qdax.tasks.brax as environments\n",
+    "from qdax.tasks.brax.env_creators import scoring_function_brax_envs as scoring_function\n",
     "from qdax.core.neuroevolution.buffers.buffer import QDTransition\n",
     "from qdax.core.neuroevolution.networks.networks import MLP\n",
     "from qdax.core.emitters.mutation_operators import isoline_variation\n",
 
@@ -284,7 +284,7 @@
    "outputs": [],
    "source": [
     "# Prepare the scoring function\n",
-    "def descriptor_extraction(data: QDTransition, mask: jnp.ndarray, linear_projection: jnp.ndarray) -> Descriptor:\n",
+    "def descriptor_extraction(data: QDTransition, mask: jax.Array, linear_projection: jax.Array) -> Descriptor:\n",
     "    \"\"\"Compute feet contact time proportion.\n",
     "\n",
     "    This function suppose that state descriptor is the feet contact, as it\n",
@@ -340,7 +340,7 @@
    "outputs": [],
    "source": [
     "def scoring_function(\n",
-    "    genotypes: jnp.ndarray, key: RNGKey\n",
+    "    genotypes: jax.Array, key: RNGKey\n",
     ") -> Tuple[Fitness, ExtraScores, RNGKey]:\n",
     "    fitnesses, _, extra_scores = scoring_fn(genotypes, key)\n",
     "    return fitnesses.reshape(-1, 1), extra_scores"