diff --git a/qdax/core/emitters/omg_mega_emitter.py b/qdax/core/emitters/omg_mega_emitter.py index 228997b3..113abfab 100644 --- a/qdax/core/emitters/omg_mega_emitter.py +++ b/qdax/core/emitters/omg_mega_emitter.py @@ -43,7 +43,7 @@ class OMGMEGAEmitter(Emitter): times. One solution that we are discussing and that is very similar to the first solution discussed above, would be to decompose the addition mechanism in two phases: one outputting the indices at which individuals will be added, and then - the actual insertion step. This would enable to reusethe same indices to add + the actual insertion step. This would enable to reuse the same indices to add the gradients instead of having to recompute them. The two design choices seem acceptable and enable to have OMG MEGA compatible diff --git a/qdax/environments/pointmaze.py b/qdax/environments/pointmaze.py index 00faa7d7..a9715329 100644 --- a/qdax/environments/pointmaze.py +++ b/qdax/environments/pointmaze.py @@ -110,7 +110,7 @@ def reset(self, rng: jp.ndarray) -> State: x_init = jp.random_uniform(rng1, (), low=self._x_min, high=self._x_max) / 10 y_init = jp.random_uniform(rng2, (), low=self._y_min, high=-0.7) obs_init = jp.array([x_init, y_init]) - # create fake qp (to reusebrax.State) + # create fake qp (to reuse brax.State) fake_qp = brax.QP.zero() # init reward, metrics and infos reward, done = jp.zeros(2)