diff --git a/main/.doctrees/environment.pickle b/main/.doctrees/environment.pickle
index 94f38ab94..9ce8befeb 100644
Binary files a/main/.doctrees/environment.pickle and b/main/.doctrees/environment.pickle differ
diff --git a/main/.doctrees/faq.doctree b/main/.doctrees/faq.doctree
index e92445c2f..d38d8579e 100644
Binary files a/main/.doctrees/faq.doctree and b/main/.doctrees/faq.doctree differ
diff --git a/main/_sources/faq.rst.txt b/main/_sources/faq.rst.txt
index 0dfa74ee9..b7acbcd83 100644
--- a/main/_sources/faq.rst.txt
+++ b/main/_sources/faq.rst.txt
@@ -1,10 +1,11 @@
 Frequently Asked Questions
 ==========================
 
-.. warning::
+Do I have to use the provided search spaces? 
+    Ideally you would re-use the existing ones to facilitate comparison. However, you are free to define your own search space, as long as you clearly state this when reporting your results.
 
-    This page is under construction.
+Can I use different environments than the ones provided?
+    Yes, we also wrap Gymnasium environments, which enables the use of many different frameworks. It is not always clear, however, that these will actually work correctly when jitted, so you should proceed with caution.
 
-
-Your first question here
-    Your answer here
+Where can I find the code for the experiments in the ARLBench paper?
+    The code for the experiments in the ARLBench paper can be found on the ``experiments`` branch of the ARLBench repo.
diff --git a/main/faq.html b/main/faq.html
index 62e212f46..78ac0bf19 100644
--- a/main/faq.html
+++ b/main/faq.html
@@ -315,12 +315,12 @@
                 
   <section id="frequently-asked-questions">
 <h1>Frequently Asked Questions<a class="headerlink" href="#frequently-asked-questions" title="Link to this heading">¶</a></h1>
-<div class="admonition warning">
-<p class="admonition-title">Warning</p>
-<p>This page is under construction.</p>
-</div>
 <dl class="simple">
-<dt>Your first question here</dt><dd><p>Your answer here</p>
+<dt>Do I have to use the provided search spaces?</dt><dd><p>Ideally you would re-use the existing ones to facilitate comparison. However, you are free to define your own search space, as long as you clearly state this when reporting your results.</p>
+</dd>
+<dt>Can I use different environments than the ones provided?</dt><dd><p>Yes, we also wrap Gymnasium environments, which enables the use of many different frameworks. It is not always clear, however, that these will actually work correctly when jitted, so you should proceed with caution.</p>
+</dd>
+<dt>Where can I find the code for the experiments in the ARLBench paper?</dt><dd><p>The code for the experiments in the ARLBench paper can be found on the <code class="docutils literal notranslate"><span class="pre">experiments</span></code> branch of the ARLBench repo.</p>
 </dd>
 </dl>
 </section>
diff --git a/main/searchindex.js b/main/searchindex.js
index 14dd5cfd6..88a6d6a07 100644
--- a/main/searchindex.js
+++ b/main/searchindex.js
@@ -1 +1 @@
-Search.setIndex({"alltitles": {"API References": [[1, "api-references"]], "Advanced Usage": [[0, "advanced-usage"]], "Basic Usage": [[48, "basic-usage"]], "Frequently Asked Questions": [[51, "frequently-asked-questions"]], "Glossary": [[52, "glossary"]], "Helpful Commands": [[49, "helpful-commands"]], "Home": [[53, "home"]], "Installation": [[54, "installation"]], "Module contents": [[38, "module-arlbench"], [39, "module-arlbench.autorl"], [40, "module-arlbench.core"], [41, "module-arlbench.core.algorithms"], [42, "module-arlbench.core.algorithms.dqn"], [43, "module-arlbench.core.algorithms.ppo"], [44, "module-arlbench.core.algorithms.sac"], [45, "module-arlbench.core.environments"], [46, "module-arlbench.core.wrappers"], [47, "module-arlbench.utils"]], "Submodules": [[38, "submodules"], [39, "submodules"], [40, "submodules"], [41, "submodules"], [42, "submodules"], [43, "submodules"], [44, "submodules"], [45, "submodules"], [46, "submodules"], [47, "submodules"]], "Subpackages": [[38, "subpackages"], [40, "subpackages"], [41, "subpackages"]], "arlbench": [[2, "module-arlbench"], [55, "arlbench"]], "arlbench package": [[38, "arlbench-package"]], "arlbench.arlbench": [[3, "module-arlbench.arlbench"]], "arlbench.arlbench module": [[38, "module-arlbench.arlbench"]], "arlbench.autorl": [[4, "module-arlbench.autorl"]], "arlbench.autorl package": [[39, "arlbench-autorl-package"]], "arlbench.autorl.autorl_env": [[5, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.autorl_env module": [[39, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.checkpointing": [[6, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.checkpointing module": [[39, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.objectives": [[7, "module-arlbench.autorl.objectives"]], "arlbench.autorl.objectives module": [[39, "module-arlbench.autorl.objectives"]], "arlbench.autorl.state_features": [[8, "module-arlbench.autorl.state_features"]], "arlbench.autorl.state_features 
module": [[39, "module-arlbench.autorl.state_features"]], "arlbench.core": [[9, "module-arlbench.core"]], "arlbench.core package": [[40, "arlbench-core-package"]], "arlbench.core.algorithms": [[10, "module-arlbench.core.algorithms"]], "arlbench.core.algorithms package": [[41, "arlbench-core-algorithms-package"]], "arlbench.core.algorithms.algorithm": [[11, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.algorithm module": [[41, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.buffers": [[12, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.buffers module": [[41, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.common": [[13, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.common module": [[41, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.dqn": [[14, "module-arlbench.core.algorithms.dqn"]], "arlbench.core.algorithms.dqn package": [[42, "arlbench-core-algorithms-dqn-package"]], "arlbench.core.algorithms.dqn.dqn": [[15, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.dqn module": [[42, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.models": [[16, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.dqn.models module": [[42, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.ppo": [[17, "module-arlbench.core.algorithms.ppo"]], "arlbench.core.algorithms.ppo package": [[43, "arlbench-core-algorithms-ppo-package"]], "arlbench.core.algorithms.ppo.models": [[18, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.models module": [[43, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.ppo": [[19, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.ppo.ppo module": [[43, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.prioritised_item_buffer": 
[[20, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.prioritised_item_buffer module": [[41, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[21, "module-arlbench.core.algorithms.sac"]], "arlbench.core.algorithms.sac package": [[44, "arlbench-core-algorithms-sac-package"]], "arlbench.core.algorithms.sac.models": [[22, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.models module": [[44, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.sac": [[23, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.algorithms.sac.sac module": [[44, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.environments": [[24, "module-arlbench.core.environments"]], "arlbench.core.environments package": [[45, "arlbench-core-environments-package"]], "arlbench.core.environments.autorl_env": [[25, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.autorl_env module": [[45, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.brax_env": [[26, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.brax_env module": [[45, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.envpool_env": [[27, "module-arlbench.core.environments.envpool_env"]], "arlbench.core.environments.envpool_env module": [[45, "module-arlbench.core.environments.envpool_env"]], "arlbench.core.environments.gymnasium_env": [[28, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnasium_env module": [[45, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnax_env": [[29, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.gymnax_env module": [[45, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.make_env": [[30, "arlbench-core-environments-make-env"]], 
"arlbench.core.environments.make_env module": [[45, "module-arlbench.core.environments.make_env"]], "arlbench.core.environments.xland_env": [[31, "module-arlbench.core.environments.xland_env"]], "arlbench.core.environments.xland_env module": [[45, "module-arlbench.core.environments.xland_env"]], "arlbench.core.running_statistics": [[32, "module-arlbench.core.running_statistics"]], "arlbench.core.running_statistics module": [[40, "module-arlbench.core.running_statistics"]], "arlbench.core.wrappers": [[33, "module-arlbench.core.wrappers"]], "arlbench.core.wrappers package": [[46, "arlbench-core-wrappers-package"]], "arlbench.core.wrappers.flatten_observation": [[34, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.flatten_observation module": [[46, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.wrapper": [[35, "module-arlbench.core.wrappers.wrapper"]], "arlbench.core.wrappers.wrapper module": [[46, "module-arlbench.core.wrappers.wrapper"]], "arlbench.utils": [[36, "module-arlbench.utils"]], "arlbench.utils package": [[47, "arlbench-utils-package"]], "arlbench.utils.common": [[37, "module-arlbench.utils.common"]], "arlbench.utils.common module": [[47, "module-arlbench.utils.common"]]}, "docnames": ["advanced_usage/index", "api", "api/arlbench", "api/arlbench.arlbench", "api/arlbench.autorl", "api/arlbench.autorl.autorl_env", "api/arlbench.autorl.checkpointing", "api/arlbench.autorl.objectives", "api/arlbench.autorl.state_features", "api/arlbench.core", "api/arlbench.core.algorithms", "api/arlbench.core.algorithms.algorithm", "api/arlbench.core.algorithms.buffers", "api/arlbench.core.algorithms.common", "api/arlbench.core.algorithms.dqn", "api/arlbench.core.algorithms.dqn.dqn", "api/arlbench.core.algorithms.dqn.models", "api/arlbench.core.algorithms.ppo", "api/arlbench.core.algorithms.ppo.models", "api/arlbench.core.algorithms.ppo.ppo", "api/arlbench.core.algorithms.prioritised_item_buffer", 
"api/arlbench.core.algorithms.sac", "api/arlbench.core.algorithms.sac.models", "api/arlbench.core.algorithms.sac.sac", "api/arlbench.core.environments", "api/arlbench.core.environments.autorl_env", "api/arlbench.core.environments.brax_env", "api/arlbench.core.environments.envpool_env", "api/arlbench.core.environments.gymnasium_env", "api/arlbench.core.environments.gymnax_env", "api/arlbench.core.environments.make_env", "api/arlbench.core.environments.xland_env", "api/arlbench.core.running_statistics", "api/arlbench.core.wrappers", "api/arlbench.core.wrappers.flatten_observation", "api/arlbench.core.wrappers.wrapper", "api/arlbench.utils", "api/arlbench.utils.common", "arlbench", "arlbench.autorl", "arlbench.core", "arlbench.core.algorithms", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.sac", "arlbench.core.environments", "arlbench.core.wrappers", "arlbench.utils", "basic_usage/index", "commands", "contributing", "faq", "glossary", "index", "installation", "modules"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["advanced_usage/index.rst", "api.rst", "api/arlbench.rst", "api/arlbench.arlbench.rst", "api/arlbench.autorl.rst", "api/arlbench.autorl.autorl_env.rst", "api/arlbench.autorl.checkpointing.rst", "api/arlbench.autorl.objectives.rst", "api/arlbench.autorl.state_features.rst", "api/arlbench.core.rst", "api/arlbench.core.algorithms.rst", "api/arlbench.core.algorithms.algorithm.rst", "api/arlbench.core.algorithms.buffers.rst", "api/arlbench.core.algorithms.common.rst", "api/arlbench.core.algorithms.dqn.rst", "api/arlbench.core.algorithms.dqn.dqn.rst", "api/arlbench.core.algorithms.dqn.models.rst", 
"api/arlbench.core.algorithms.ppo.rst", "api/arlbench.core.algorithms.ppo.models.rst", "api/arlbench.core.algorithms.ppo.ppo.rst", "api/arlbench.core.algorithms.prioritised_item_buffer.rst", "api/arlbench.core.algorithms.sac.rst", "api/arlbench.core.algorithms.sac.models.rst", "api/arlbench.core.algorithms.sac.sac.rst", "api/arlbench.core.environments.rst", "api/arlbench.core.environments.autorl_env.rst", "api/arlbench.core.environments.brax_env.rst", "api/arlbench.core.environments.envpool_env.rst", "api/arlbench.core.environments.gymnasium_env.rst", "api/arlbench.core.environments.gymnax_env.rst", "api/arlbench.core.environments.make_env.rst", "api/arlbench.core.environments.xland_env.rst", "api/arlbench.core.running_statistics.rst", "api/arlbench.core.wrappers.rst", "api/arlbench.core.wrappers.flatten_observation.rst", "api/arlbench.core.wrappers.wrapper.rst", "api/arlbench.utils.rst", "api/arlbench.utils.common.rst", "arlbench.rst", "arlbench.autorl.rst", "arlbench.core.rst", "arlbench.core.algorithms.rst", "arlbench.core.algorithms.dqn.rst", "arlbench.core.algorithms.ppo.rst", "arlbench.core.algorithms.sac.rst", "arlbench.core.environments.rst", "arlbench.core.wrappers.rst", "arlbench.utils.rst", "basic_usage/index.rst", "commands.rst", "contributing.rst", "faq.rst", "glossary.rst", "index.rst", "installation.rst", "modules.rst"], "indexentries": {"__call__() (arlbench.autorl.objectives.emissions static method)": [[7, "arlbench.autorl.objectives.Emissions.__call__", false], [39, "arlbench.autorl.objectives.Emissions.__call__", false]], "__call__() (arlbench.autorl.objectives.objective static method)": [[7, "arlbench.autorl.objectives.Objective.__call__", false], [39, "arlbench.autorl.objectives.Objective.__call__", false]], "__call__() (arlbench.autorl.objectives.rewardmean static method)": [[7, "arlbench.autorl.objectives.RewardMean.__call__", false], [39, "arlbench.autorl.objectives.RewardMean.__call__", false]], "__call__() 
(arlbench.autorl.objectives.rewardstd static method)": [[7, "arlbench.autorl.objectives.RewardStd.__call__", false], [39, "arlbench.autorl.objectives.RewardStd.__call__", false]], "__call__() (arlbench.autorl.objectives.runtime static method)": [[7, "arlbench.autorl.objectives.Runtime.__call__", false], [39, "arlbench.autorl.objectives.Runtime.__call__", false]], "__call__() (arlbench.autorl.state_features.gradinfo static method)": [[8, "arlbench.autorl.state_features.GradInfo.__call__", false], [39, "arlbench.autorl.state_features.GradInfo.__call__", false]], "__call__() (arlbench.autorl.state_features.statefeature static method)": [[8, "arlbench.autorl.state_features.StateFeature.__call__", false], [39, "arlbench.autorl.state_features.StateFeature.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.cnnq method)": [[16, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false], [42, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.mlpq method)": [[16, "arlbench.core.algorithms.dqn.models.MLPQ.__call__", false], [42, "arlbench.core.algorithms.dqn.models.MLPQ.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false], [43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false], [43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.alphacoef method)": [[22, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false], [44, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false], [44, 
"arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacvectorcritic method)": [[22, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false]], "__lt__() (arlbench.autorl.objectives.objective method)": [[7, "arlbench.autorl.objectives.Objective.__lt__", false], [39, "arlbench.autorl.objectives.Objective.__lt__", false]], "__new__() (arlbench.autorl.objectives.objective static method)": [[7, "arlbench.autorl.objectives.Objective.__new__", false], [39, "arlbench.autorl.objectives.Objective.__new__", false]], "__new__() (arlbench.autorl.state_features.statefeature static method)": [[8, "arlbench.autorl.state_features.StateFeature.__new__", false], [39, "arlbench.autorl.state_features.StateFeature.__new__", false]], "action (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.action", false]], "action (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.action", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.action", false]], "action (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.action", 
false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.action", false]], "action (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.action", false], [44, "arlbench.core.algorithms.sac.sac.Transition.action", false]], "action_dim (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.action_dim", false]], "action_dim (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.action_dim", false]], "action_space (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false]], "action_space (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.action_space", false], [39, "arlbench.autorl.AutoRLEnv.action_space", false]], 
"action_space (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.action_space", false], [38, "arlbench.AutoRLEnv.action_space", false]], "action_space (arlbench.core.environments.brax_env.braxenv property)": [[26, "arlbench.core.environments.brax_env.BraxEnv.action_space", false], [45, "arlbench.core.environments.brax_env.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.braxenv property)": [[24, "arlbench.core.environments.BraxEnv.action_space", false], [45, "arlbench.core.environments.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[27, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false], [45, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.envpoolenv property)": [[24, "arlbench.core.environments.EnvpoolEnv.action_space", false], [45, "arlbench.core.environments.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[28, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false], [45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasiumenv property)": [[24, "arlbench.core.environments.GymnasiumEnv.action_space", false], [45, "arlbench.core.environments.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[29, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false], [45, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.gymnaxenv property)": [[24, "arlbench.core.environments.GymnaxEnv.action_space", false], [45, "arlbench.core.environments.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.xland_env.xlandenv property)": [[31, 
"arlbench.core.environments.xland_env.XLandEnv.action_space", false], [45, "arlbench.core.environments.xland_env.XLandEnv.action_space", false]], "action_space() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.action_space", false], [45, "arlbench.core.environments.autorl_env.Environment.action_space", false]], "action_space() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.action_space", false], [45, "arlbench.core.environments.Environment.action_space", false]], "action_type (arlbench.core.algorithms.algorithm property)": [[10, "arlbench.core.algorithms.Algorithm.action_type", false], [41, "arlbench.core.algorithms.Algorithm.action_type", false]], "action_type (arlbench.core.algorithms.algorithm.algorithm property)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false]], "activation (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.activation", false]], "activation (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.activation", false]], "activation (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.activation", false]], "activation (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, 
"arlbench.core.algorithms.sac.models.SACMLPActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.activation", false]], "actor_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false]], "actor_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false], [44, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false]], "actor_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false]], "actor_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false], [44, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false]], "actor_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false]], "actor_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false]], "advantages (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false]], "advantages (arlbench.core.algorithms.ppo.ppometrics attribute)": [[17, 
"arlbench.core.algorithms.ppo.PPOMetrics.advantages", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics.advantages", false]], "algorithm (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.Algorithm", false], [41, "arlbench.core.algorithms.Algorithm", false]], "algorithm (class in arlbench.core.algorithms.algorithm)": [[11, "arlbench.core.algorithms.algorithm.Algorithm", false], [41, "arlbench.core.algorithms.algorithm.Algorithm", false]], "algorithms (arlbench.autorl.autorl_env.autorlenv attribute)": [[39, "arlbench.autorl.autorl_env.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorl.autorlenv attribute)": [[39, "arlbench.autorl.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorlenv attribute)": [[38, "arlbench.AutoRLEnv.ALGORITHMS", false]], "alpha_init (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, "arlbench.core.algorithms.sac.models.AlphaCoef.alpha_init", false]], "alpha_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false]], "alpha_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false], [44, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false]], "alpha_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false]], "alpha_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false]], "alphacoef (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.AlphaCoef", false], [44, 
"arlbench.core.algorithms.sac.models.AlphaCoef", false]], "arlbench": [[2, "module-arlbench", false], [38, "module-arlbench", false]], "arlbench.arlbench": [[3, "module-arlbench.arlbench", false], [38, "module-arlbench.arlbench", false]], "arlbench.autorl": [[4, "module-arlbench.autorl", false], [39, "module-arlbench.autorl", false]], "arlbench.autorl.autorl_env": [[5, "module-arlbench.autorl.autorl_env", false], [39, "module-arlbench.autorl.autorl_env", false]], "arlbench.autorl.checkpointing": [[6, "module-arlbench.autorl.checkpointing", false], [39, "module-arlbench.autorl.checkpointing", false]], "arlbench.autorl.objectives": [[7, "module-arlbench.autorl.objectives", false], [39, "module-arlbench.autorl.objectives", false]], "arlbench.autorl.state_features": [[8, "module-arlbench.autorl.state_features", false], [39, "module-arlbench.autorl.state_features", false]], "arlbench.core": [[9, "module-arlbench.core", false], [40, "module-arlbench.core", false]], "arlbench.core.algorithms": [[10, "module-arlbench.core.algorithms", false], [41, "module-arlbench.core.algorithms", false]], "arlbench.core.algorithms.algorithm": [[11, "module-arlbench.core.algorithms.algorithm", false], [41, "module-arlbench.core.algorithms.algorithm", false]], "arlbench.core.algorithms.buffers": [[12, "module-arlbench.core.algorithms.buffers", false], [41, "module-arlbench.core.algorithms.buffers", false]], "arlbench.core.algorithms.common": [[13, "module-arlbench.core.algorithms.common", false], [41, "module-arlbench.core.algorithms.common", false]], "arlbench.core.algorithms.dqn": [[14, "module-arlbench.core.algorithms.dqn", false], [42, "module-arlbench.core.algorithms.dqn", false]], "arlbench.core.algorithms.dqn.dqn": [[15, "module-arlbench.core.algorithms.dqn.dqn", false], [42, "module-arlbench.core.algorithms.dqn.dqn", false]], "arlbench.core.algorithms.dqn.models": [[16, "module-arlbench.core.algorithms.dqn.models", false], [42, "module-arlbench.core.algorithms.dqn.models", false]], 
"arlbench.core.algorithms.ppo": [[17, "module-arlbench.core.algorithms.ppo", false], [43, "module-arlbench.core.algorithms.ppo", false]], "arlbench.core.algorithms.ppo.models": [[18, "module-arlbench.core.algorithms.ppo.models", false], [43, "module-arlbench.core.algorithms.ppo.models", false]], "arlbench.core.algorithms.ppo.ppo": [[19, "module-arlbench.core.algorithms.ppo.ppo", false], [43, "module-arlbench.core.algorithms.ppo.ppo", false]], "arlbench.core.algorithms.prioritised_item_buffer": [[20, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [41, "module-arlbench.core.algorithms.prioritised_item_buffer", false]], "arlbench.core.algorithms.sac": [[21, "module-arlbench.core.algorithms.sac", false], [44, "module-arlbench.core.algorithms.sac", false]], "arlbench.core.algorithms.sac.models": [[22, "module-arlbench.core.algorithms.sac.models", false], [44, "module-arlbench.core.algorithms.sac.models", false]], "arlbench.core.algorithms.sac.sac": [[23, "module-arlbench.core.algorithms.sac.sac", false], [44, "module-arlbench.core.algorithms.sac.sac", false]], "arlbench.core.environments": [[24, "module-arlbench.core.environments", false], [45, "module-arlbench.core.environments", false]], "arlbench.core.environments.autorl_env": [[25, "module-arlbench.core.environments.autorl_env", false], [45, "module-arlbench.core.environments.autorl_env", false]], "arlbench.core.environments.brax_env": [[26, "module-arlbench.core.environments.brax_env", false], [45, "module-arlbench.core.environments.brax_env", false]], "arlbench.core.environments.envpool_env": [[27, "module-arlbench.core.environments.envpool_env", false], [45, "module-arlbench.core.environments.envpool_env", false]], "arlbench.core.environments.gymnasium_env": [[28, "module-arlbench.core.environments.gymnasium_env", false], [45, "module-arlbench.core.environments.gymnasium_env", false]], "arlbench.core.environments.gymnax_env": [[29, "module-arlbench.core.environments.gymnax_env", false], [45, 
"module-arlbench.core.environments.gymnax_env", false]], "arlbench.core.environments.make_env": [[45, "module-arlbench.core.environments.make_env", false]], "arlbench.core.environments.xland_env": [[31, "module-arlbench.core.environments.xland_env", false], [45, "module-arlbench.core.environments.xland_env", false]], "arlbench.core.running_statistics": [[32, "module-arlbench.core.running_statistics", false], [40, "module-arlbench.core.running_statistics", false]], "arlbench.core.wrappers": [[33, "module-arlbench.core.wrappers", false], [46, "module-arlbench.core.wrappers", false]], "arlbench.core.wrappers.flatten_observation": [[34, "module-arlbench.core.wrappers.flatten_observation", false], [46, "module-arlbench.core.wrappers.flatten_observation", false]], "arlbench.core.wrappers.wrapper": [[35, "module-arlbench.core.wrappers.wrapper", false], [46, "module-arlbench.core.wrappers.wrapper", false]], "arlbench.utils": [[36, "module-arlbench.utils", false], [47, "module-arlbench.utils", false]], "arlbench.utils.common": [[37, "module-arlbench.utils.common", false], [47, "module-arlbench.utils.common", false]], "automl": [[52, "term-AutoML", true]], "autorl": [[52, "term-AutoRL", true]], "autorlenv (class in arlbench)": [[2, "arlbench.AutoRLEnv", false], [38, "arlbench.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl)": [[4, "arlbench.autorl.AutoRLEnv", false], [39, "arlbench.autorl.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl.autorl_env)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv", false]], "bo": [[52, "term-BO", true]], "braxenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.BraxEnv", false], [45, "arlbench.core.environments.BraxEnv", false]], "braxenv (class in arlbench.core.environments.brax_env)": [[26, "arlbench.core.environments.brax_env.BraxEnv", false], [45, "arlbench.core.environments.brax_env.BraxEnv", false]], "buffer_state 
(arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false], [42, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[17, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false], [43, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false], [44, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sacstate attribute)": [[21, "arlbench.core.algorithms.sac.SACState.buffer_state", false], [44, "arlbench.core.algorithms.sac.SACState.buffer_state", false]], "checkpointer (class in arlbench.autorl.checkpointing)": [[6, "arlbench.autorl.checkpointing.Checkpointer", false], [39, "arlbench.autorl.checkpointing.Checkpointer", false]], "checkpoints (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.checkpoints", false], [39, "arlbench.autorl.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.checkpoints", false], [38, "arlbench.AutoRLEnv.checkpoints", false]], "cnnactorcritic (class in arlbench.core.algorithms.ppo.models)": [[18, 
"arlbench.core.algorithms.ppo.models.CNNActorCritic", false], [43, "arlbench.core.algorithms.ppo.models.CNNActorCritic", false]], "cnnq (class in arlbench.core.algorithms.dqn.models)": [[16, "arlbench.core.algorithms.dqn.models.CNNQ", false], [42, "arlbench.core.algorithms.dqn.models.CNNQ", false]], "config (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.config", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.config", false]], "config (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.config", false], [39, "arlbench.autorl.AutoRLEnv.config", false]], "config (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.config", false], [38, "arlbench.AutoRLEnv.config", false]], "config_space (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false]], "config_space (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.config_space", false], [39, "arlbench.autorl.AutoRLEnv.config_space", false]], "config_space (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.config_space", false], [38, "arlbench.AutoRLEnv.config_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils)": [[36, "arlbench.utils.config_space_to_gymnasium_space", false], [47, "arlbench.utils.config_space_to_gymnasium_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.config_space_to_gymnasium_space", false], [47, "arlbench.utils.common.config_space_to_gymnasium_space", false]], "config_space_to_yaml() (in module arlbench.utils)": [[36, "arlbench.utils.config_space_to_yaml", false], [47, "arlbench.utils.config_space_to_yaml", false]], "config_space_to_yaml() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.config_space_to_yaml", false], [47, "arlbench.utils.common.config_space_to_yaml", false]], 
"count (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[40, "arlbench.core.running_statistics.RunningStatisticsState.count", false]], "create_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[20, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false], [41, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false]], "create_with_opt_state() (arlbench.core.algorithms.dqn.dqn.dqntrainstate class method)": [[42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.ppo.ppo.ppotrainstate class method)": [[43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.sac.sac.sactrainstate class method)": [[44, "arlbench.core.algorithms.sac.sac.SACTrainState.create_with_opt_state", false]], "critic (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.critic", false]], "critic_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false]], "critic_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false], [44, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false]], "critic_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false]], "critic_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false], [44, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false]], "critic_train_state 
(arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false]], "critic_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false]], "cur_rewards (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false]], "cur_rewards (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false]], "denormalize() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.denormalize", false], [40, "arlbench.core.running_statistics.denormalize", false]], "discrete (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.discrete", false]], "discrete (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.discrete", false]], "done (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.done", false]], "done (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.done", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.done", false]], "done 
(arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.done", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.done", false]], "done (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.done", false], [44, "arlbench.core.algorithms.sac.sac.Transition.done", false]], "dqn": [[52, "term-DQN", true]], "dqn (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.DQN", false], [41, "arlbench.core.algorithms.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQN", false], [42, "arlbench.core.algorithms.dqn.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false]], "dqnstate (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNState", false], [42, "arlbench.core.algorithms.dqn.DQNState", false]], "dqnstate (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNState", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNState", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn)": [[14, 
"arlbench.core.algorithms.dqn.DQNTrainingResult", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false]], "dqntrainreturnt (in module arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false], [42, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false]], "dqntrainstate (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false]], "emissions (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.Emissions", false], [39, "arlbench.autorl.objectives.Emissions", false]], "env_name (arlbench.core.environments.autorl_env.environment property)": [[25, "arlbench.core.environments.autorl_env.Environment.env_name", false], [45, "arlbench.core.environments.autorl_env.Environment.env_name", false]], "env_name (arlbench.core.environments.environment property)": [[24, "arlbench.core.environments.Environment.env_name", false], [45, "arlbench.core.environments.Environment.env_name", false]], "env_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": 
[[17, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false]], "environment (class in arlbench.core.environments)": [[24, "arlbench.core.environments.Environment", false], [45, "arlbench.core.environments.Environment", false]], "environment (class in arlbench.core.environments.autorl_env)": [[25, "arlbench.core.environments.autorl_env.Environment", false], [45, "arlbench.core.environments.autorl_env.Environment", false]], "envpoolenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.EnvpoolEnv", false], [45, "arlbench.core.environments.EnvpoolEnv", false]], "envpoolenv (class in arlbench.core.environments.envpool_env)": [[27, "arlbench.core.environments.envpool_env.EnvpoolEnv", false], [45, "arlbench.core.environments.envpool_env.EnvpoolEnv", false]], "eval() (arlbench.autorl.autorl_env.autorlenv method)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false]], "eval() (arlbench.autorl.autorlenv method)": [[4, "arlbench.autorl.AutoRLEnv.eval", false], [39, "arlbench.autorl.AutoRLEnv.eval", false]], "eval() (arlbench.autorlenv method)": [[2, "arlbench.AutoRLEnv.eval", false], [38, "arlbench.AutoRLEnv.eval", false]], "eval() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.eval", false], [41, "arlbench.core.algorithms.Algorithm.eval", false]], "eval() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, 
"arlbench.core.algorithms.algorithm.Algorithm.eval", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.eval", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[14, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false]], "flattenobservationwrapper (class in arlbench.core.wrappers)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper", false]], "flattenobservationwrapper (class in arlbench.core.wrappers.flatten_observation)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false]], 
"from_tuple() (arlbench.core.algorithms.common.timestep method)": [[41, "arlbench.core.algorithms.common.TimeStep.from_tuple", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false], [42, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false], [43, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() 
(arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false], [41, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_default_hpo_config", false], [41, "arlbench.core.algorithms.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false], [42, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_default_hpo_config", false], [41, 
"arlbench.core.algorithms.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false], [43, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_default_hpo_config", false], [41, "arlbench.core.algorithms.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false], [44, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false], [41, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_default_nas_config", false], [41, "arlbench.core.algorithms.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn static method)": [[14, 
"arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false], [42, "arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_default_nas_config", false], [41, "arlbench.core.algorithms.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false], [43, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_default_nas_config", false], [41, "arlbench.core.algorithms.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false], [44, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false]], "get_hpo_config_space() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false], [41, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() 
(arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_hpo_config_space", false], [41, "arlbench.core.algorithms.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false], [42, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_hpo_config_space", false], [41, "arlbench.core.algorithms.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false], [43, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_hpo_config_space", false], [41, "arlbench.core.algorithms.SAC.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false], [44, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false]], "get_hpo_config_space() 
(arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false], [41, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_hpo_search_space", false], [41, "arlbench.core.algorithms.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false], [42, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_hpo_search_space", false], [41, "arlbench.core.algorithms.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false], [43, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false]], 
"get_hpo_search_space() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_hpo_search_space", false], [41, "arlbench.core.algorithms.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false], [44, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false], [41, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_nas_config_space", false], [41, "arlbench.core.algorithms.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false], [42, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_nas_config_space", false], [41, "arlbench.core.algorithms.PPO.get_nas_config_space", false]], 
"get_nas_config_space() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false], [43, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_nas_config_space", false], [41, "arlbench.core.algorithms.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false], [44, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false]], "get_spec() (arlbench.autorl.objectives.emissions static method)": [[7, "arlbench.autorl.objectives.Emissions.get_spec", false], [39, "arlbench.autorl.objectives.Emissions.get_spec", false]], "get_spec() (arlbench.autorl.objectives.objective static method)": [[7, "arlbench.autorl.objectives.Objective.get_spec", false], [39, "arlbench.autorl.objectives.Objective.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardmean static method)": [[7, "arlbench.autorl.objectives.RewardMean.get_spec", false], [39, "arlbench.autorl.objectives.RewardMean.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardstd static method)": [[7, "arlbench.autorl.objectives.RewardStd.get_spec", false], [39, "arlbench.autorl.objectives.RewardStd.get_spec", false]], "get_spec() (arlbench.autorl.objectives.runtime static method)": [[7, "arlbench.autorl.objectives.Runtime.get_spec", false], [39, 
"arlbench.autorl.objectives.Runtime.get_spec", false]], "get_state_space() (arlbench.autorl.state_features.gradinfo static method)": [[8, "arlbench.autorl.state_features.GradInfo.get_state_space", false], [39, "arlbench.autorl.state_features.GradInfo.get_state_space", false]], "get_state_space() (arlbench.autorl.state_features.statefeature static method)": [[8, "arlbench.autorl.state_features.StateFeature.get_state_space", false], [39, "arlbench.autorl.state_features.StateFeature.get_state_space", false]], "global_step (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false]], "gradinfo (class in arlbench.autorl.state_features)": [[8, "arlbench.autorl.state_features.GradInfo", false], [39, 
"arlbench.autorl.state_features.GradInfo", false]], "grads (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppometrics attribute)": [[17, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils)": [[36, "arlbench.utils.gymnasium_space_to_gymnax_space", false], [47, "arlbench.utils.gymnasium_space_to_gymnax_space", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.gymnasium_space_to_gymnax_space", false], [47, "arlbench.utils.common.gymnasium_space_to_gymnax_space", false]], "gymnasiumenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.GymnasiumEnv", false], [45, "arlbench.core.environments.GymnasiumEnv", false]], "gymnasiumenv (class in arlbench.core.environments.gymnasium_env)": [[28, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false], [45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false]], "gymnaxenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.GymnaxEnv", false], [45, "arlbench.core.environments.GymnaxEnv", false]], "gymnaxenv (class in arlbench.core.environments.gymnax_env)": [[29, "arlbench.core.environments.gymnax_env.GymnaxEnv", false], [45, "arlbench.core.environments.gymnax_env.GymnaxEnv", false]], "hidden_size 
(arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.hidden_size", false]], "hpo": [[52, "term-HPO", true]], "hpo_config (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.hpo_config", false], [39, "arlbench.autorl.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.hpo_config", false], [38, "arlbench.AutoRLEnv.hpo_config", false]], "info (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, 
"arlbench.core.algorithms.dqn.dqn.Transition.info", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.info", false]], "info (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.info", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.info", false]], "info (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.info", false], [44, "arlbench.core.algorithms.sac.sac.Transition.info", false]], "init() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.init", false], [41, "arlbench.core.algorithms.Algorithm.init", false]], "init() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.init", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.init", false]], "init() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.init", false], [41, "arlbench.core.algorithms.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.init", false], [42, "arlbench.core.algorithms.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.init", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.ppo method)": [[10, "arlbench.core.algorithms.PPO.init", false], [41, "arlbench.core.algorithms.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo method)": [[17, "arlbench.core.algorithms.ppo.PPO.init", false], [43, "arlbench.core.algorithms.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.init", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.init", false], [41, "arlbench.core.algorithms.SAC.init", 
false]], "init() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.init", false], [44, "arlbench.core.algorithms.sac.SAC.init", false]], "init() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.init", false], [44, "arlbench.core.algorithms.sac.sac.SAC.init", false]], "init_state() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.init_state", false], [40, "arlbench.core.running_statistics.init_state", false]], "items() (arlbench.core.algorithms.common.timestep method)": [[13, "arlbench.core.algorithms.common.TimeStep.items", false], [41, "arlbench.core.algorithms.common.TimeStep.items", false]], "key (arlbench.autorl.objectives.emissions attribute)": [[39, "arlbench.autorl.objectives.Emissions.KEY", false]], "key (arlbench.autorl.objectives.objective attribute)": [[39, "arlbench.autorl.objectives.Objective.KEY", false]], "key (arlbench.autorl.objectives.rewardmean attribute)": [[39, "arlbench.autorl.objectives.RewardMean.KEY", false]], "key (arlbench.autorl.objectives.rewardstd attribute)": [[39, "arlbench.autorl.objectives.RewardStd.KEY", false]], "key (arlbench.autorl.objectives.runtime attribute)": [[39, "arlbench.autorl.objectives.Runtime.KEY", false]], "key (arlbench.autorl.state_features.gradinfo attribute)": [[39, "arlbench.autorl.state_features.GradInfo.KEY", false]], "key (arlbench.autorl.state_features.statefeature attribute)": [[39, "arlbench.autorl.state_features.StateFeature.KEY", false]], "keys() (arlbench.core.algorithms.common.timestep method)": [[13, "arlbench.core.algorithms.common.TimeStep.keys", false], [41, "arlbench.core.algorithms.common.TimeStep.keys", false]], "last_obs (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.last_obs", false]], "load() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.load", false], [39, 
"arlbench.autorl.checkpointing.Checkpointer.load", false]], "load_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false], [39, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false]], "log_prob (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false]], "log_std_max (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_max", false]], "log_std_max (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_max", false]], "log_std_min (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_min", false]], "log_std_min (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_min", false]], "loss (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppometrics attribute)": [[17, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false]], "make_env() (in module arlbench.core.environments)": [[24, "arlbench.core.environments.make_env", false], [30, 
"arlbench.core.environments.make_env", false], [45, "arlbench.core.environments.make_env", false]], "make_env() (in module arlbench.core.environments.make_env)": [[45, "arlbench.core.environments.make_env.make_env", false]], "make_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[20, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false], [41, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false]], "mean (arlbench.core.running_statistics.nestedmeanstd attribute)": [[40, "arlbench.core.running_statistics.NestedMeanStd.mean", false]], "metrics (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[14, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false]], "mlpactorcritic (class in 
arlbench.core.algorithms.ppo.models)": [[18, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false], [43, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false]], "mlpq (class in arlbench.core.algorithms.dqn.models)": [[16, "arlbench.core.algorithms.dqn.models.MLPQ", false], [42, "arlbench.core.algorithms.dqn.models.MLPQ", false]], "mode() (arlbench.core.algorithms.sac.models.tanhtransformeddistribution method)": [[22, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false], [44, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false]], "module": [[2, "module-arlbench", false], [3, "module-arlbench.arlbench", false], [4, "module-arlbench.autorl", false], [5, "module-arlbench.autorl.autorl_env", false], [6, "module-arlbench.autorl.checkpointing", false], [7, "module-arlbench.autorl.objectives", false], [8, "module-arlbench.autorl.state_features", false], [9, "module-arlbench.core", false], [10, "module-arlbench.core.algorithms", false], [11, "module-arlbench.core.algorithms.algorithm", false], [12, "module-arlbench.core.algorithms.buffers", false], [13, "module-arlbench.core.algorithms.common", false], [14, "module-arlbench.core.algorithms.dqn", false], [15, "module-arlbench.core.algorithms.dqn.dqn", false], [16, "module-arlbench.core.algorithms.dqn.models", false], [17, "module-arlbench.core.algorithms.ppo", false], [18, "module-arlbench.core.algorithms.ppo.models", false], [19, "module-arlbench.core.algorithms.ppo.ppo", false], [20, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [21, "module-arlbench.core.algorithms.sac", false], [22, "module-arlbench.core.algorithms.sac.models", false], [23, "module-arlbench.core.algorithms.sac.sac", false], [24, "module-arlbench.core.environments", false], [25, "module-arlbench.core.environments.autorl_env", false], [26, "module-arlbench.core.environments.brax_env", false], [27, "module-arlbench.core.environments.envpool_env", false], [28, 
"module-arlbench.core.environments.gymnasium_env", false], [29, "module-arlbench.core.environments.gymnax_env", false], [31, "module-arlbench.core.environments.xland_env", false], [32, "module-arlbench.core.running_statistics", false], [33, "module-arlbench.core.wrappers", false], [34, "module-arlbench.core.wrappers.flatten_observation", false], [35, "module-arlbench.core.wrappers.wrapper", false], [36, "module-arlbench.utils", false], [37, "module-arlbench.utils.common", false], [38, "module-arlbench", false], [38, "module-arlbench.arlbench", false], [39, "module-arlbench.autorl", false], [39, "module-arlbench.autorl.autorl_env", false], [39, "module-arlbench.autorl.checkpointing", false], [39, "module-arlbench.autorl.objectives", false], [39, "module-arlbench.autorl.state_features", false], [40, "module-arlbench.core", false], [40, "module-arlbench.core.running_statistics", false], [41, "module-arlbench.core.algorithms", false], [41, "module-arlbench.core.algorithms.algorithm", false], [41, "module-arlbench.core.algorithms.buffers", false], [41, "module-arlbench.core.algorithms.common", false], [41, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [42, "module-arlbench.core.algorithms.dqn", false], [42, "module-arlbench.core.algorithms.dqn.dqn", false], [42, "module-arlbench.core.algorithms.dqn.models", false], [43, "module-arlbench.core.algorithms.ppo", false], [43, "module-arlbench.core.algorithms.ppo.models", false], [43, "module-arlbench.core.algorithms.ppo.ppo", false], [44, "module-arlbench.core.algorithms.sac", false], [44, "module-arlbench.core.algorithms.sac.models", false], [44, "module-arlbench.core.algorithms.sac.sac", false], [45, "module-arlbench.core.environments", false], [45, "module-arlbench.core.environments.autorl_env", false], [45, "module-arlbench.core.environments.brax_env", false], [45, "module-arlbench.core.environments.envpool_env", false], [45, "module-arlbench.core.environments.gymnasium_env", false], [45, 
"module-arlbench.core.environments.gymnax_env", false], [45, "module-arlbench.core.environments.make_env", false], [45, "module-arlbench.core.environments.xland_env", false], [46, "module-arlbench.core.wrappers", false], [46, "module-arlbench.core.wrappers.flatten_observation", false], [46, "module-arlbench.core.wrappers.wrapper", false], [47, "module-arlbench.utils", false], [47, "module-arlbench.utils.common", false]], "mrp_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[39, "arlbench.autorl.checkpointing.Checkpointer.MRP_FILE", false]], "multi-fidelity optimization": [[52, "term-Multi-fidelity-optimization", true]], "n_critics (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.n_critics", false]], "n_envs (arlbench.core.environments.autorl_env.environment property)": [[25, "arlbench.core.environments.autorl_env.Environment.n_envs", false], [45, "arlbench.core.environments.autorl_env.Environment.n_envs", false]], "n_envs (arlbench.core.environments.environment property)": [[24, "arlbench.core.environments.Environment.n_envs", false], [45, "arlbench.core.environments.Environment.n_envs", false]], "name (arlbench.core.algorithms.algorithm attribute)": [[41, "arlbench.core.algorithms.Algorithm.name", false]], "name (arlbench.core.algorithms.algorithm.algorithm attribute)": [[41, "arlbench.core.algorithms.algorithm.Algorithm.name", false]], "name (arlbench.core.algorithms.dqn attribute)": [[41, "arlbench.core.algorithms.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn attribute)": [[42, "arlbench.core.algorithms.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn.dqn attribute)": [[42, "arlbench.core.algorithms.dqn.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.name", false]], "name (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, 
"arlbench.core.algorithms.dqn.models.MLPQ.name", false]], "name (arlbench.core.algorithms.ppo attribute)": [[41, "arlbench.core.algorithms.PPO.name", false]], "name (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.ppo attribute)": [[43, "arlbench.core.algorithms.ppo.PPO.name", false]], "name (arlbench.core.algorithms.ppo.ppo.ppo attribute)": [[43, "arlbench.core.algorithms.ppo.ppo.PPO.name", false]], "name (arlbench.core.algorithms.sac attribute)": [[41, "arlbench.core.algorithms.SAC.name", false]], "name (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, "arlbench.core.algorithms.sac.models.AlphaCoef.name", false]], "name (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.name", false]], "name (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.name", false]], "name (arlbench.core.algorithms.sac.sac attribute)": [[44, "arlbench.core.algorithms.sac.SAC.name", false]], "name (arlbench.core.algorithms.sac.sac.sac attribute)": [[44, "arlbench.core.algorithms.sac.sac.SAC.name", false]], "nestedmeanstd (class in arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.NestedMeanStd", false], [40, 
"arlbench.core.running_statistics.NestedMeanStd", false]], "network_state (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[44, "arlbench.core.algorithms.sac.sac.SACTrainState.network_state", false]], "nodes_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[39, "arlbench.autorl.checkpointing.Checkpointer.NODES_FILE", false]], "normalize() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.normalize", false], [40, "arlbench.core.running_statistics.normalize", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false]], "numpy_to_jax() (in module 
arlbench.core.environments.envpool_env)": [[27, "arlbench.core.environments.envpool_env.numpy_to_jax", false], [45, "arlbench.core.environments.envpool_env.numpy_to_jax", false]], "objective (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.Objective", false], [39, "arlbench.autorl.objectives.Objective", false]], "objectives (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false]], "objectives (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.objectives", false], [39, "arlbench.autorl.AutoRLEnv.objectives", false]], "objectives (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.objectives", false], [38, "arlbench.AutoRLEnv.objectives", false]], "obs (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false]], "obs (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false]], "obs (arlbench.core.algorithms.ppo.pporunnerstate attribute)": 
[[17, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.obs", false], [44, "arlbench.core.algorithms.sac.sac.Transition.obs", false]], "obs (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.obs", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.obs", false]], "observation_space (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.observation_space", false], [39, "arlbench.autorl.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.observation_space", false], [38, "arlbench.AutoRLEnv.observation_space", false]], "observation_space (arlbench.core.environments.brax_env.braxenv property)": [[26, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false], [45, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.braxenv property)": [[24, "arlbench.core.environments.BraxEnv.observation_space", false], [45, "arlbench.core.environments.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[27, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false], [45, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false]], "observation_space 
(arlbench.core.environments.envpoolenv property)": [[24, "arlbench.core.environments.EnvpoolEnv.observation_space", false], [45, "arlbench.core.environments.EnvpoolEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[28, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false], [45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasiumenv property)": [[24, "arlbench.core.environments.GymnasiumEnv.observation_space", false], [45, "arlbench.core.environments.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[29, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false], [45, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnaxenv property)": [[24, "arlbench.core.environments.GymnaxEnv.observation_space", false], [45, "arlbench.core.environments.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.xland_env.xlandenv property)": [[31, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false], [45, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false]], "observation_space (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper property)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false]], "observation_space (arlbench.core.wrappers.flattenobservationwrapper property)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false]], "observation_space() 
(arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.observation_space", false], [45, "arlbench.core.environments.autorl_env.Environment.observation_space", false]], "observation_space() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.observation_space", false], [45, "arlbench.core.environments.Environment.observation_space", false]], "opt_state (arlbench.core.algorithms.dqn.dqn.dqntrainstate attribute)": [[42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.opt_state", false]], "opt_state (arlbench.core.algorithms.ppo.ppo.ppotrainstate attribute)": [[43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.opt_state", false]], "parent (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.parent", false]], "parent (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.parent", false]], "parent (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.parent", false]], "parent (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, "arlbench.core.algorithms.sac.models.AlphaCoef.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, 
"arlbench.core.algorithms.sac.models.SACMLPCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.parent", false]], "ppo": [[52, "term-PPO", true]], "ppo (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.PPO", false], [41, "arlbench.core.algorithms.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPO", false], [43, "arlbench.core.algorithms.ppo.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO", false]], "ppometrics (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOMetrics", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics", false]], "ppometrics (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false]], "ppostate (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOState", false], [43, "arlbench.core.algorithms.ppo.PPOState", false]], "ppostate (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOState", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOState", false]], "ppotrainingresult (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult", false]], "ppotrainingresult (class in 
arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false]], "ppotrainreturnt (in module arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false], [43, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false]], "ppotrainstate (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false]], "predict() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.predict", false], [41, "arlbench.core.algorithms.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.predict", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.predict", false], [41, "arlbench.core.algorithms.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.predict", false], [42, "arlbench.core.algorithms.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.ppo method)": [[10, "arlbench.core.algorithms.PPO.predict", false], [41, "arlbench.core.algorithms.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo method)": [[17, "arlbench.core.algorithms.ppo.PPO.predict", false], [43, "arlbench.core.algorithms.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.sac 
method)": [[10, "arlbench.core.algorithms.SAC.predict", false], [41, "arlbench.core.algorithms.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.predict", false], [44, "arlbench.core.algorithms.sac.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.predict", false], [44, "arlbench.core.algorithms.sac.sac.SAC.predict", false]], "random search": [[52, "term-Random-Search", true]], "rank (arlbench.autorl.objectives.emissions attribute)": [[39, "arlbench.autorl.objectives.Emissions.RANK", false]], "rank (arlbench.autorl.objectives.objective attribute)": [[39, "arlbench.autorl.objectives.Objective.RANK", false]], "rank (arlbench.autorl.objectives.rewardmean attribute)": [[39, "arlbench.autorl.objectives.RewardMean.RANK", false]], "rank (arlbench.autorl.objectives.rewardstd attribute)": [[39, "arlbench.autorl.objectives.RewardStd.RANK", false]], "rank (arlbench.autorl.objectives.runtime attribute)": [[39, "arlbench.autorl.objectives.Runtime.RANK", false]], "recursive_concat() (in module arlbench.utils)": [[36, "arlbench.utils.recursive_concat", false], [47, "arlbench.utils.recursive_concat", false]], "recursive_concat() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.recursive_concat", false], [47, "arlbench.utils.common.recursive_concat", false]], "replace() (arlbench.core.algorithms.common.timestep method)": [[41, "arlbench.core.algorithms.common.TimeStep.replace", false]], "replace() (arlbench.core.algorithms.dqn.dqn.dqntrainstate method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false]], "replace() (arlbench.core.algorithms.ppo.ppo.ppotrainstate method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false]], "replace() 
(arlbench.core.algorithms.sac.sac.sactrainstate method)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false]], "replace() (arlbench.core.running_statistics.nestedmeanstd method)": [[32, "arlbench.core.running_statistics.NestedMeanStd.replace", false], [40, "arlbench.core.running_statistics.NestedMeanStd.replace", false]], "replace() (arlbench.core.running_statistics.runningstatisticsstate method)": [[32, "arlbench.core.running_statistics.RunningStatisticsState.replace", false], [40, "arlbench.core.running_statistics.RunningStatisticsState.replace", false]], "reset() (arlbench.autorl.autorl_env.autorlenv method)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false]], "reset() (arlbench.autorl.autorlenv method)": [[4, "arlbench.autorl.AutoRLEnv.reset", false], [39, "arlbench.autorl.AutoRLEnv.reset", false]], "reset() (arlbench.autorlenv method)": [[2, "arlbench.AutoRLEnv.reset", false], [38, "arlbench.AutoRLEnv.reset", false]], "reset() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.reset", false], [45, "arlbench.core.environments.autorl_env.Environment.reset", false]], "reset() (arlbench.core.environments.brax_env.braxenv method)": [[45, "arlbench.core.environments.brax_env.BraxEnv.reset", false]], "reset() (arlbench.core.environments.braxenv method)": [[45, "arlbench.core.environments.BraxEnv.reset", false]], "reset() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.reset", false], [45, "arlbench.core.environments.Environment.reset", false]], "reset() (arlbench.core.environments.envpool_env.envpoolenv method)": [[45, "arlbench.core.environments.envpool_env.EnvpoolEnv.reset", false]], "reset() (arlbench.core.environments.envpoolenv method)": [[45, "arlbench.core.environments.EnvpoolEnv.reset", 
false]], "reset() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnasiumenv method)": [[45, "arlbench.core.environments.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[45, "arlbench.core.environments.gymnax_env.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.gymnaxenv method)": [[45, "arlbench.core.environments.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.xland_env.xlandenv method)": [[45, "arlbench.core.environments.xland_env.XLandEnv.reset", false]], "reset() (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false]], "reset() (arlbench.core.wrappers.flattenobservationwrapper method)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper.reset", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper.reset", false]], "return_buffer (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false]], "return_buffer (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, 
"arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false]], "reward (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.reward", false]], "reward (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false]], "reward (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false]], "reward (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.reward", false], [44, "arlbench.core.algorithms.sac.sac.Transition.reward", false]], "rewardmean (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.RewardMean", false], [39, "arlbench.autorl.objectives.RewardMean", false]], "rewardstd (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.RewardStd", false], [39, "arlbench.autorl.objectives.RewardStd", false]], "rng (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.rng", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.rng", 
false]], "rng (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false]], "rng (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.rng", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.rng", false]], "run_arlbench() (in module arlbench)": [[2, "arlbench.run_arlbench", false], [38, "arlbench.run_arlbench", false]], "run_arlbench() (in module arlbench.arlbench)": [[3, "arlbench.arlbench.run_arlbench", false], [38, "arlbench.arlbench.run_arlbench", false]], "runner_state (arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false]], "runner_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNState.runner_state", false], [42, "arlbench.core.algorithms.dqn.DQNState.runner_state", false]], "runner_state (arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[17, "arlbench.core.algorithms.ppo.PPOState.runner_state", false], [43, "arlbench.core.algorithms.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false], [44, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sacstate attribute)": [[21, "arlbench.core.algorithms.sac.SACState.runner_state", false], [44, "arlbench.core.algorithms.sac.SACState.runner_state", false]], "runningstatisticsstate (class in arlbench.core.running_statistics)": [[32, 
"arlbench.core.running_statistics.RunningStatisticsState", false], [40, "arlbench.core.running_statistics.RunningStatisticsState", false]], "runtime (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.Runtime", false], [39, "arlbench.autorl.objectives.Runtime", false]], "sac": [[52, "term-SAC", true]], "sac (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.SAC", false], [41, "arlbench.core.algorithms.SAC", false]], "sac (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SAC", false], [44, "arlbench.core.algorithms.sac.SAC", false]], "sac (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SAC", false], [44, "arlbench.core.algorithms.sac.sac.SAC", false]], "saccnnactor (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACCNNActor", false], [44, "arlbench.core.algorithms.sac.models.SACCNNActor", false]], "saccnncritic (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACCNNCritic", false], [44, "arlbench.core.algorithms.sac.models.SACCNNCritic", false]], "sacmetrics (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACMetrics", false], [44, "arlbench.core.algorithms.sac.SACMetrics", false]], "sacmetrics (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics", false]], "sacmlpactor (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACMLPActor", false], [44, "arlbench.core.algorithms.sac.models.SACMLPActor", false]], "sacmlpcritic (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACMLPCritic", false], [44, "arlbench.core.algorithms.sac.models.SACMLPCritic", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACRunnerState", 
false], [44, "arlbench.core.algorithms.sac.SACRunnerState", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState", false]], "sacstate (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACState", false], [44, "arlbench.core.algorithms.sac.SACState", false]], "sacstate (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACState", false], [44, "arlbench.core.algorithms.sac.sac.SACState", false]], "sactrainingresult (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult", false]], "sactrainingresult (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false]], "sactrainreturnt (in module arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACTrainReturnT", false], [44, "arlbench.core.algorithms.sac.SACTrainReturnT", false]], "sactrainstate (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainState", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainState", false]], "sacvectorcritic (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACVectorCritic", false], [44, "arlbench.core.algorithms.sac.models.SACVectorCritic", false]], "sample_action() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[45, "arlbench.core.environments.gymnax_env.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.gymnaxenv method)": [[45, "arlbench.core.environments.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.xland_env.xlandenv method)": [[45, "arlbench.core.environments.xland_env.XLandEnv.sample_action", 
false]], "sample_actions() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.sample_actions", false], [45, "arlbench.core.environments.autorl_env.Environment.sample_actions", false]], "sample_actions() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.sample_actions", false], [45, "arlbench.core.environments.Environment.sample_actions", false]], "save() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.save", false], [39, "arlbench.autorl.checkpointing.Checkpointer.save", false]], "save_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false], [39, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false]], "save_defaults_to_yaml() (in module arlbench.utils)": [[36, "arlbench.utils.save_defaults_to_yaml", false], [47, "arlbench.utils.save_defaults_to_yaml", false]], "save_defaults_to_yaml() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.save_defaults_to_yaml", false], [47, "arlbench.utils.common.save_defaults_to_yaml", false]], "scalars_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[39, "arlbench.autorl.checkpointing.Checkpointer.SCALARS_FILE", false]], "scope (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.scope", false]], "scope (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.scope", false]], "scope (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.scope", false]], "scope (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, 
"arlbench.core.algorithms.sac.models.AlphaCoef.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.scope", false]], "setup() (arlbench.core.algorithms.dqn.models.cnnq method)": [[16, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false], [42, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false]], "setup() (arlbench.core.algorithms.dqn.models.mlpq method)": [[16, "arlbench.core.algorithms.dqn.models.MLPQ.setup", false], [42, "arlbench.core.algorithms.dqn.models.MLPQ.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false], [43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false], [43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.alphacoef method)": [[22, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false], [44, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNActor.setup", false], [44, 
"arlbench.core.algorithms.sac.models.SACCNNActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false], [44, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false], [44, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false], [44, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false]], "statefeature (class in arlbench.autorl.state_features)": [[8, "arlbench.autorl.state_features.StateFeature", false], [39, "arlbench.autorl.state_features.StateFeature", false]], "std (arlbench.core.running_statistics.nestedmeanstd attribute)": [[40, "arlbench.core.running_statistics.NestedMeanStd.std", false]], "step() (arlbench.autorl.autorl_env.autorlenv method)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.step", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.step", false]], "step() (arlbench.autorl.autorlenv method)": [[4, "arlbench.autorl.AutoRLEnv.step", false], [39, "arlbench.autorl.AutoRLEnv.step", false]], "step() (arlbench.autorlenv method)": [[2, "arlbench.AutoRLEnv.step", false], [38, "arlbench.AutoRLEnv.step", false]], "step() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.step", false], [45, "arlbench.core.environments.autorl_env.Environment.step", false]], "step() (arlbench.core.environments.brax_env.braxenv method)": [[45, "arlbench.core.environments.brax_env.BraxEnv.step", false]], "step() (arlbench.core.environments.braxenv method)": [[45, "arlbench.core.environments.BraxEnv.step", false]], "step() (arlbench.core.environments.environment method)": [[24, 
"arlbench.core.environments.Environment.step", false], [45, "arlbench.core.environments.Environment.step", false]], "step() (arlbench.core.environments.envpool_env.envpoolenv method)": [[45, "arlbench.core.environments.envpool_env.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.envpoolenv method)": [[45, "arlbench.core.environments.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnasiumenv method)": [[45, "arlbench.core.environments.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[45, "arlbench.core.environments.gymnax_env.GymnaxEnv.step", false]], "step() (arlbench.core.environments.gymnaxenv method)": [[45, "arlbench.core.environments.GymnaxEnv.step", false]], "step() (arlbench.core.environments.xland_env.xlandenv method)": [[45, "arlbench.core.environments.xland_env.XLandEnv.step", false]], "step() (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false]], "step() (arlbench.core.wrappers.flattenobservationwrapper method)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper.step", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper.step", false]], "summed_variance (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[40, "arlbench.core.running_statistics.RunningStatisticsState.summed_variance", false]], "tanhtransformeddistribution (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false], [44, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false]], "target_params (arlbench.core.algorithms.dqn.dqn.dqntrainstate 
attribute)": [[42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.target_params", false]], "target_params (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[44, "arlbench.core.algorithms.sac.sac.SACTrainState.target_params", false]], "td_error (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.td_error", false], [44, "arlbench.core.algorithms.sac.SACMetrics.td_error", false]], "timestep (class in arlbench.core.algorithms.common)": [[13, "arlbench.core.algorithms.common.TimeStep", false], [41, "arlbench.core.algorithms.common.TimeStep", false]], "to_tuple() (arlbench.core.algorithms.common.timestep method)": [[41, "arlbench.core.algorithms.common.TimeStep.to_tuple", false]], "train() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.train", false], [41, "arlbench.core.algorithms.Algorithm.train", false]], "train() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.train", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.train", false]], "train() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.train", false], [41, "arlbench.core.algorithms.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.train", false], [42, 
"arlbench.core.algorithms.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.train", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.ppo method)": [[10, "arlbench.core.algorithms.PPO.train", false], [41, "arlbench.core.algorithms.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo method)": [[17, "arlbench.core.algorithms.ppo.PPO.train", false], [43, "arlbench.core.algorithms.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.train", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.train", false], [41, "arlbench.core.algorithms.SAC.train", false]], "train() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.train", false], [44, "arlbench.core.algorithms.sac.SAC.train", false]], "train() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.train", false], [44, "arlbench.core.algorithms.sac.sac.SAC.train", false]], "train_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, 
"arlbench.core.algorithms.ppo.PPORunnerState.train_state", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.train_state", false]], "trajectories (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[14, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false]], "transition (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition", false]], "transition (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition", false]], "transition (class in arlbench.core.algorithms.sac.sac)": [[23, 
"arlbench.core.algorithms.sac.sac.Transition", false], [44, "arlbench.core.algorithms.sac.sac.Transition", false]], "tuple_concat() (in module arlbench.utils)": [[36, "arlbench.utils.tuple_concat", false], [47, "arlbench.utils.tuple_concat", false]], "tuple_concat() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.tuple_concat", false], [47, "arlbench.utils.common.tuple_concat", false]], "uniform_sample() (in module arlbench.core.algorithms.buffers)": [[12, "arlbench.core.algorithms.buffers.uniform_sample", false], [41, "arlbench.core.algorithms.buffers.uniform_sample", false]], "update() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.update", false], [41, "arlbench.core.algorithms.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.update", false], [42, "arlbench.core.algorithms.dqn.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.update", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.update", false]], "update() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.update", false], [40, "arlbench.core.running_statistics.update", false]], "update_actor() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.update_actor", false], [41, "arlbench.core.algorithms.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.update_actor", false], [44, "arlbench.core.algorithms.sac.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false], [44, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false]], "update_alpha() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.update_alpha", false], [41, "arlbench.core.algorithms.SAC.update_alpha", 
false]], "update_alpha() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.update_alpha", false], [44, "arlbench.core.algorithms.sac.SAC.update_alpha", false]], "update_alpha() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false], [44, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false]], "update_critic() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.update_critic", false], [41, "arlbench.core.algorithms.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.update_critic", false], [44, "arlbench.core.algorithms.sac.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false], [44, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.update_hpo_config", false], [41, "arlbench.core.algorithms.Algorithm.update_hpo_config", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false]], "value (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.value", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.value", false]], "value (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.value", false], [44, "arlbench.core.algorithms.sac.sac.Transition.value", false]], "values() (arlbench.core.algorithms.common.timestep method)": [[13, "arlbench.core.algorithms.common.TimeStep.values", false], [41, "arlbench.core.algorithms.common.TimeStep.values", false]], 
"wrapper (class in arlbench.core.wrappers)": [[33, "arlbench.core.wrappers.Wrapper", false], [46, "arlbench.core.wrappers.Wrapper", false]], "wrapper (class in arlbench.core.wrappers.wrapper)": [[35, "arlbench.core.wrappers.wrapper.Wrapper", false], [46, "arlbench.core.wrappers.wrapper.Wrapper", false]], "xlandenv (class in arlbench.core.environments.xland_env)": [[31, "arlbench.core.environments.xland_env.XLandEnv", false], [45, "arlbench.core.environments.xland_env.XLandEnv", false]]}, "objects": {"": [[38, 0, 0, "-", "arlbench"]], "arlbench": [[38, 1, 1, "", "AutoRLEnv"], [38, 0, 0, "-", "arlbench"], [39, 0, 0, "-", "autorl"], [40, 0, 0, "-", "core"], [38, 5, 1, "", "run_arlbench"], [47, 0, 0, "-", "utils"]], "arlbench.AutoRLEnv": [[38, 2, 1, "", "ALGORITHMS"], [38, 3, 1, "", "action_space"], [38, 3, 1, "", "checkpoints"], [38, 3, 1, "", "config"], [38, 3, 1, "", "config_space"], [38, 4, 1, "", "eval"], [38, 3, 1, "", "hpo_config"], [38, 3, 1, "", "objectives"], [38, 3, 1, "", "observation_space"], [38, 4, 1, "", "reset"], [38, 4, 1, "", "step"]], "arlbench.arlbench": [[38, 5, 1, "", "run_arlbench"]], "arlbench.autorl": [[39, 1, 1, "", "AutoRLEnv"], [39, 0, 0, "-", "autorl_env"], [39, 0, 0, "-", "checkpointing"], [39, 0, 0, "-", "objectives"], [39, 0, 0, "-", "state_features"]], "arlbench.autorl.AutoRLEnv": [[39, 2, 1, "", "ALGORITHMS"], [39, 3, 1, "", "action_space"], [39, 3, 1, "", "checkpoints"], [39, 3, 1, "", "config"], [39, 3, 1, "", "config_space"], [39, 4, 1, "", "eval"], [39, 3, 1, "", "hpo_config"], [39, 3, 1, "", "objectives"], [39, 3, 1, "", "observation_space"], [39, 4, 1, "", "reset"], [39, 4, 1, "", "step"]], "arlbench.autorl.autorl_env": [[39, 1, 1, "", "AutoRLEnv"]], "arlbench.autorl.autorl_env.AutoRLEnv": [[39, 2, 1, "", "ALGORITHMS"], [39, 3, 1, "", "action_space"], [39, 3, 1, "", "checkpoints"], [39, 3, 1, "", "config"], [39, 3, 1, "", "config_space"], [39, 4, 1, "", "eval"], [39, 3, 1, "", "hpo_config"], [39, 3, 1, "", "objectives"], [39, 3, 
1, "", "observation_space"], [39, 4, 1, "", "reset"], [39, 4, 1, "", "step"]], "arlbench.autorl.checkpointing": [[39, 1, 1, "", "Checkpointer"]], "arlbench.autorl.checkpointing.Checkpointer": [[39, 2, 1, "", "MRP_FILE"], [39, 2, 1, "", "NODES_FILE"], [39, 2, 1, "", "SCALARS_FILE"], [39, 4, 1, "", "load"], [39, 4, 1, "", "load_buffer"], [39, 4, 1, "", "save"], [39, 4, 1, "", "save_buffer"]], "arlbench.autorl.objectives": [[39, 1, 1, "", "Emissions"], [39, 1, 1, "", "Objective"], [39, 1, 1, "", "RewardMean"], [39, 1, 1, "", "RewardStd"], [39, 1, 1, "", "Runtime"]], "arlbench.autorl.objectives.Emissions": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Objective": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "__lt__"], [39, 4, 1, "", "__new__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardMean": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardStd": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Runtime": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.state_features": [[39, 1, 1, "", "GradInfo"], [39, 1, 1, "", "StateFeature"]], "arlbench.autorl.state_features.GradInfo": [[39, 2, 1, "", "KEY"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_state_space"]], "arlbench.autorl.state_features.StateFeature": [[39, 2, 1, "", "KEY"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "__new__"], [39, 4, 1, "", "get_state_space"]], "arlbench.core": [[41, 0, 0, "-", "algorithms"], [45, 0, 0, "-", "environments"], [40, 0, 0, "-", "running_statistics"], [46, 0, 0, "-", "wrappers"]], "arlbench.core.algorithms": [[41, 1, 1, "", "Algorithm"], [41, 1, 1, "", "DQN"], [41, 1, 1, "", "PPO"], [41, 1, 
1, "", "SAC"], [41, 0, 0, "-", "algorithm"], [41, 0, 0, "-", "buffers"], [41, 0, 0, "-", "common"], [42, 0, 0, "-", "dqn"], [43, 0, 0, "-", "ppo"], [41, 0, 0, "-", "prioritised_item_buffer"], [44, 0, 0, "-", "sac"]], "arlbench.core.algorithms.Algorithm": [[41, 3, 1, "", "action_type"], [41, 4, 1, "", "eval"], [41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.DQN": [[41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update"]], "arlbench.core.algorithms.PPO": [[41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"]], "arlbench.core.algorithms.SAC": [[41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update_actor"], [41, 4, 1, "", "update_alpha"], [41, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.algorithm": 
[[41, 1, 1, "", "Algorithm"]], "arlbench.core.algorithms.algorithm.Algorithm": [[41, 3, 1, "", "action_type"], [41, 4, 1, "", "eval"], [41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.buffers": [[41, 5, 1, "", "uniform_sample"]], "arlbench.core.algorithms.common": [[41, 1, 1, "", "TimeStep"]], "arlbench.core.algorithms.common.TimeStep": [[41, 2, 1, "", "action"], [41, 2, 1, "", "done"], [41, 4, 1, "", "from_tuple"], [41, 4, 1, "", "items"], [41, 4, 1, "", "keys"], [41, 2, 1, "", "last_obs"], [41, 2, 1, "", "obs"], [41, 4, 1, "", "replace"], [41, 2, 1, "", "reward"], [41, 4, 1, "", "to_tuple"], [41, 4, 1, "", "values"]], "arlbench.core.algorithms.dqn": [[42, 1, 1, "", "DQN"], [42, 1, 1, "", "DQNMetrics"], [42, 1, 1, "", "DQNRunnerState"], [42, 1, 1, "", "DQNState"], [42, 2, 1, "", "DQNTrainReturnT"], [42, 1, 1, "", "DQNTrainingResult"], [42, 0, 0, "-", "dqn"], [42, 0, 0, "-", "models"]], "arlbench.core.algorithms.dqn.DQN": [[42, 4, 1, "", "get_checkpoint_factory"], [42, 4, 1, "", "get_default_hpo_config"], [42, 4, 1, "", "get_default_nas_config"], [42, 4, 1, "", "get_hpo_config_space"], [42, 4, 1, "", "get_hpo_search_space"], [42, 4, 1, "", "get_nas_config_space"], [42, 4, 1, "", "init"], [42, 2, 1, "", "name"], [42, 4, 1, "", "predict"], [42, 4, 1, "", "train"], [42, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.DQNMetrics": [[42, 2, 1, "", "grads"], [42, 2, 1, "", "loss"], [42, 2, 1, "", "td_error"]], "arlbench.core.algorithms.dqn.DQNRunnerState": [[42, 2, 1, "", "env_state"], [42, 2, 1, "", "global_step"], [42, 2, 1, "", "normalizer_state"], [42, 2, 1, "", "obs"], [42, 2, 1, "", "rng"], [42, 2, 1, "", 
"train_state"]], "arlbench.core.algorithms.dqn.DQNState": [[42, 2, 1, "", "buffer_state"], [42, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.DQNTrainingResult": [[42, 2, 1, "", "eval_rewards"], [42, 2, 1, "", "metrics"], [42, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn": [[42, 1, 1, "", "DQN"], [42, 1, 1, "", "DQNMetrics"], [42, 1, 1, "", "DQNRunnerState"], [42, 1, 1, "", "DQNState"], [42, 1, 1, "", "DQNTrainState"], [42, 1, 1, "", "DQNTrainingResult"], [42, 1, 1, "", "Transition"]], "arlbench.core.algorithms.dqn.dqn.DQN": [[42, 4, 1, "", "get_checkpoint_factory"], [42, 4, 1, "", "get_default_hpo_config"], [42, 4, 1, "", "get_default_nas_config"], [42, 4, 1, "", "get_hpo_config_space"], [42, 4, 1, "", "get_hpo_search_space"], [42, 4, 1, "", "get_nas_config_space"], [42, 4, 1, "", "init"], [42, 2, 1, "", "name"], [42, 4, 1, "", "predict"], [42, 4, 1, "", "train"], [42, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.dqn.DQNMetrics": [[42, 2, 1, "", "grads"], [42, 2, 1, "", "loss"], [42, 2, 1, "", "td_error"]], "arlbench.core.algorithms.dqn.dqn.DQNRunnerState": [[42, 2, 1, "", "env_state"], [42, 2, 1, "", "global_step"], [42, 2, 1, "", "normalizer_state"], [42, 2, 1, "", "obs"], [42, 2, 1, "", "rng"], [42, 2, 1, "", "train_state"]], "arlbench.core.algorithms.dqn.dqn.DQNState": [[42, 2, 1, "", "buffer_state"], [42, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainState": [[42, 4, 1, "", "create_with_opt_state"], [42, 2, 1, "", "opt_state"], [42, 4, 1, "", "replace"], [42, 2, 1, "", "target_params"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult": [[42, 2, 1, "", "eval_rewards"], [42, 2, 1, "", "metrics"], [42, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn.Transition": [[42, 2, 1, "", "action"], [42, 2, 1, "", "done"], [42, 2, 1, "", "info"], [42, 2, 1, "", "obs"], [42, 2, 1, "", "reward"]], "arlbench.core.algorithms.dqn.models": [[42, 1, 1, "", "CNNQ"], [42, 1, 1, "", "MLPQ"]], 
"arlbench.core.algorithms.dqn.models.CNNQ": [[42, 4, 1, "", "__call__"], [42, 2, 1, "", "action_dim"], [42, 2, 1, "", "activation"], [42, 2, 1, "", "discrete"], [42, 2, 1, "", "hidden_size"], [42, 2, 1, "", "name"], [42, 2, 1, "", "parent"], [42, 2, 1, "", "scope"], [42, 4, 1, "", "setup"]], "arlbench.core.algorithms.dqn.models.MLPQ": [[42, 4, 1, "", "__call__"], [42, 2, 1, "", "action_dim"], [42, 2, 1, "", "activation"], [42, 2, 1, "", "discrete"], [42, 2, 1, "", "hidden_size"], [42, 2, 1, "", "name"], [42, 2, 1, "", "parent"], [42, 2, 1, "", "scope"], [42, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo": [[43, 1, 1, "", "PPO"], [43, 1, 1, "", "PPOMetrics"], [43, 1, 1, "", "PPORunnerState"], [43, 1, 1, "", "PPOState"], [43, 2, 1, "", "PPOTrainReturnT"], [43, 1, 1, "", "PPOTrainingResult"], [43, 0, 0, "-", "models"], [43, 0, 0, "-", "ppo"]], "arlbench.core.algorithms.ppo.PPO": [[43, 4, 1, "", "get_checkpoint_factory"], [43, 4, 1, "", "get_default_hpo_config"], [43, 4, 1, "", "get_default_nas_config"], [43, 4, 1, "", "get_hpo_config_space"], [43, 4, 1, "", "get_hpo_search_space"], [43, 4, 1, "", "get_nas_config_space"], [43, 4, 1, "", "init"], [43, 2, 1, "", "name"], [43, 4, 1, "", "predict"], [43, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.PPOMetrics": [[43, 2, 1, "", "advantages"], [43, 2, 1, "", "grads"], [43, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.PPORunnerState": [[43, 2, 1, "", "cur_rewards"], [43, 2, 1, "", "env_state"], [43, 2, 1, "", "global_step"], [43, 2, 1, "", "normalizer_state"], [43, 2, 1, "", "obs"], [43, 2, 1, "", "return_buffer"], [43, 2, 1, "", "return_buffer_idx"], [43, 2, 1, "", "rng"], [43, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.PPOState": [[43, 2, 1, "", "buffer_state"], [43, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.PPOTrainingResult": [[43, 2, 1, "", "eval_rewards"], [43, 2, 1, "", "metrics"], [43, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.models": [[43, 1, 1, "", 
"CNNActorCritic"], [43, 1, 1, "", "MLPActorCritic"]], "arlbench.core.algorithms.ppo.models.CNNActorCritic": [[43, 4, 1, "", "__call__"], [43, 2, 1, "", "action_dim"], [43, 2, 1, "", "activation"], [43, 2, 1, "", "discrete"], [43, 2, 1, "", "hidden_size"], [43, 2, 1, "", "name"], [43, 2, 1, "", "parent"], [43, 2, 1, "", "scope"], [43, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.models.MLPActorCritic": [[43, 4, 1, "", "__call__"], [43, 2, 1, "", "action_dim"], [43, 2, 1, "", "activation"], [43, 2, 1, "", "discrete"], [43, 2, 1, "", "hidden_size"], [43, 2, 1, "", "name"], [43, 2, 1, "", "parent"], [43, 2, 1, "", "scope"], [43, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.ppo": [[43, 1, 1, "", "PPO"], [43, 1, 1, "", "PPOMetrics"], [43, 1, 1, "", "PPORunnerState"], [43, 1, 1, "", "PPOState"], [43, 1, 1, "", "PPOTrainState"], [43, 1, 1, "", "PPOTrainingResult"], [43, 1, 1, "", "Transition"]], "arlbench.core.algorithms.ppo.ppo.PPO": [[43, 4, 1, "", "get_checkpoint_factory"], [43, 4, 1, "", "get_default_hpo_config"], [43, 4, 1, "", "get_default_nas_config"], [43, 4, 1, "", "get_hpo_config_space"], [43, 4, 1, "", "get_hpo_search_space"], [43, 4, 1, "", "get_nas_config_space"], [43, 4, 1, "", "init"], [43, 2, 1, "", "name"], [43, 4, 1, "", "predict"], [43, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.ppo.PPOMetrics": [[43, 2, 1, "", "advantages"], [43, 2, 1, "", "grads"], [43, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.ppo.PPORunnerState": [[43, 2, 1, "", "cur_rewards"], [43, 2, 1, "", "env_state"], [43, 2, 1, "", "global_step"], [43, 2, 1, "", "normalizer_state"], [43, 2, 1, "", "obs"], [43, 2, 1, "", "return_buffer"], [43, 2, 1, "", "return_buffer_idx"], [43, 2, 1, "", "rng"], [43, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.ppo.PPOState": [[43, 2, 1, "", "buffer_state"], [43, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainState": [[43, 4, 1, "", "create_with_opt_state"], [43, 2, 1, "", "opt_state"], [43, 4, 1, 
"", "replace"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult": [[43, 2, 1, "", "eval_rewards"], [43, 2, 1, "", "metrics"], [43, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.ppo.Transition": [[43, 2, 1, "", "action"], [43, 2, 1, "", "done"], [43, 2, 1, "", "info"], [43, 2, 1, "", "log_prob"], [43, 2, 1, "", "obs"], [43, 2, 1, "", "reward"], [43, 2, 1, "", "value"]], "arlbench.core.algorithms.prioritised_item_buffer": [[41, 5, 1, "", "create_prioritised_item_buffer"], [41, 5, 1, "", "make_prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[44, 1, 1, "", "SAC"], [44, 1, 1, "", "SACMetrics"], [44, 1, 1, "", "SACRunnerState"], [44, 1, 1, "", "SACState"], [44, 2, 1, "", "SACTrainReturnT"], [44, 1, 1, "", "SACTrainingResult"], [44, 0, 0, "-", "models"], [44, 0, 0, "-", "sac"]], "arlbench.core.algorithms.sac.SAC": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_actor"], [44, 4, 1, "", "update_alpha"], [44, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.SACMetrics": [[44, 2, 1, "", "actor_grads"], [44, 2, 1, "", "actor_loss"], [44, 2, 1, "", "alpha_loss"], [44, 2, 1, "", "critic_grads"], [44, 2, 1, "", "critic_loss"], [44, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.SACRunnerState": [[44, 2, 1, "", "actor_train_state"], [44, 2, 1, "", "alpha_train_state"], [44, 2, 1, "", "critic_train_state"], [44, 2, 1, "", "env_state"], [44, 2, 1, "", "global_step"], [44, 2, 1, "", "normalizer_state"], [44, 2, 1, "", "obs"], [44, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.SACState": [[44, 2, 1, "", "buffer_state"], [44, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.SACTrainingResult": [[44, 2, 1, "", 
"eval_rewards"], [44, 2, 1, "", "metrics"], [44, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.models": [[44, 1, 1, "", "AlphaCoef"], [44, 1, 1, "", "SACCNNActor"], [44, 1, 1, "", "SACCNNCritic"], [44, 1, 1, "", "SACMLPActor"], [44, 1, 1, "", "SACMLPCritic"], [44, 1, 1, "", "SACVectorCritic"], [44, 1, 1, "", "TanhTransformedDistribution"]], "arlbench.core.algorithms.sac.models.AlphaCoef": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "alpha_init"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNActor": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "log_std_max"], [44, 2, 1, "", "log_std_min"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNCritic": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPActor": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "log_std_max"], [44, 2, 1, "", "log_std_min"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPCritic": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACVectorCritic": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "critic"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", 
"n_critics"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"]], "arlbench.core.algorithms.sac.models.TanhTransformedDistribution": [[44, 4, 1, "", "mode"]], "arlbench.core.algorithms.sac.sac": [[44, 1, 1, "", "SAC"], [44, 1, 1, "", "SACMetrics"], [44, 1, 1, "", "SACRunnerState"], [44, 1, 1, "", "SACState"], [44, 1, 1, "", "SACTrainState"], [44, 1, 1, "", "SACTrainingResult"], [44, 1, 1, "", "Transition"]], "arlbench.core.algorithms.sac.sac.SAC": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_actor"], [44, 4, 1, "", "update_alpha"], [44, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.sac.SACMetrics": [[44, 2, 1, "", "actor_grads"], [44, 2, 1, "", "actor_loss"], [44, 2, 1, "", "alpha_loss"], [44, 2, 1, "", "critic_grads"], [44, 2, 1, "", "critic_loss"], [44, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.sac.SACRunnerState": [[44, 2, 1, "", "actor_train_state"], [44, 2, 1, "", "alpha_train_state"], [44, 2, 1, "", "critic_train_state"], [44, 2, 1, "", "env_state"], [44, 2, 1, "", "global_step"], [44, 2, 1, "", "normalizer_state"], [44, 2, 1, "", "obs"], [44, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.sac.SACState": [[44, 2, 1, "", "buffer_state"], [44, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.sac.SACTrainState": [[44, 4, 1, "", "create_with_opt_state"], [44, 2, 1, "", "network_state"], [44, 4, 1, "", "replace"], [44, 2, 1, "", "target_params"]], "arlbench.core.algorithms.sac.sac.SACTrainingResult": [[44, 2, 1, "", "eval_rewards"], [44, 2, 1, "", "metrics"], [44, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.sac.Transition": [[44, 2, 1, "", "action"], [44, 2, 1, "", 
"done"], [44, 2, 1, "", "info"], [44, 2, 1, "", "obs"], [44, 2, 1, "", "reward"], [44, 2, 1, "", "value"]], "arlbench.core.environments": [[45, 1, 1, "", "BraxEnv"], [45, 1, 1, "", "Environment"], [45, 1, 1, "", "EnvpoolEnv"], [45, 1, 1, "", "GymnasiumEnv"], [45, 1, 1, "", "GymnaxEnv"], [45, 0, 0, "-", "autorl_env"], [45, 0, 0, "-", "brax_env"], [45, 0, 0, "-", "envpool_env"], [45, 0, 0, "-", "gymnasium_env"], [45, 0, 0, "-", "gymnax_env"], [45, 5, 1, "", "make_env"], [45, 0, 0, "-", "make_env"], [45, 0, 0, "-", "xland_env"]], "arlbench.core.environments.BraxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.Environment": [[45, 4, 1, "", "action_space"], [45, 3, 1, "", "env_name"], [45, 3, 1, "", "n_envs"], [45, 4, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_actions"], [45, 4, 1, "", "step"]], "arlbench.core.environments.EnvpoolEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.GymnasiumEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.GymnaxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_action"], [45, 4, 1, "", "step"]], "arlbench.core.environments.autorl_env": [[45, 1, 1, "", "Environment"]], "arlbench.core.environments.autorl_env.Environment": [[45, 4, 1, "", "action_space"], [45, 3, 1, "", "env_name"], [45, 3, 1, "", "n_envs"], [45, 4, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_actions"], [45, 4, 1, "", "step"]], "arlbench.core.environments.brax_env": [[45, 1, 1, "", "BraxEnv"]], "arlbench.core.environments.brax_env.BraxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", 
"reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.envpool_env": [[45, 1, 1, "", "EnvpoolEnv"], [45, 5, 1, "", "numpy_to_jax"]], "arlbench.core.environments.envpool_env.EnvpoolEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.gymnasium_env": [[45, 1, 1, "", "GymnasiumEnv"]], "arlbench.core.environments.gymnasium_env.GymnasiumEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.gymnax_env": [[45, 1, 1, "", "GymnaxEnv"]], "arlbench.core.environments.gymnax_env.GymnaxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_action"], [45, 4, 1, "", "step"]], "arlbench.core.environments.make_env": [[45, 5, 1, "", "make_env"]], "arlbench.core.environments.xland_env": [[45, 1, 1, "", "XLandEnv"]], "arlbench.core.environments.xland_env.XLandEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_action"], [45, 4, 1, "", "step"]], "arlbench.core.running_statistics": [[40, 1, 1, "", "NestedMeanStd"], [40, 1, 1, "", "RunningStatisticsState"], [40, 5, 1, "", "denormalize"], [40, 5, 1, "", "init_state"], [40, 5, 1, "", "normalize"], [40, 5, 1, "", "update"]], "arlbench.core.running_statistics.NestedMeanStd": [[40, 2, 1, "", "mean"], [40, 4, 1, "", "replace"], [40, 2, 1, "", "std"]], "arlbench.core.running_statistics.RunningStatisticsState": [[40, 2, 1, "", "count"], [40, 4, 1, "", "replace"], [40, 2, 1, "", "summed_variance"]], "arlbench.core.wrappers": [[46, 1, 1, "", "FlattenObservationWrapper"], [46, 1, 1, "", "Wrapper"], [46, 0, 0, "-", "flatten_observation"], [46, 0, 0, "-", "wrapper"]], "arlbench.core.wrappers.FlattenObservationWrapper": [[46, 3, 1, "", "observation_space"], [46, 4, 1, "", "reset"], [46, 4, 1, "", "step"]], 
"arlbench.core.wrappers.flatten_observation": [[46, 1, 1, "", "FlattenObservationWrapper"]], "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper": [[46, 3, 1, "", "observation_space"], [46, 4, 1, "", "reset"], [46, 4, 1, "", "step"]], "arlbench.core.wrappers.wrapper": [[46, 1, 1, "", "Wrapper"]], "arlbench.utils": [[47, 0, 0, "-", "common"], [47, 5, 1, "", "config_space_to_gymnasium_space"], [47, 5, 1, "", "config_space_to_yaml"], [47, 5, 1, "", "gymnasium_space_to_gymnax_space"], [47, 5, 1, "", "recursive_concat"], [47, 5, 1, "", "save_defaults_to_yaml"], [47, 5, 1, "", "tuple_concat"]], "arlbench.utils.common": [[47, 5, 1, "", "config_space_to_gymnasium_space"], [47, 5, 1, "", "config_space_to_yaml"], [47, 5, 1, "", "gymnasium_space_to_gymnax_space"], [47, 5, 1, "", "recursive_concat"], [47, 5, 1, "", "save_defaults_to_yaml"], [47, 5, 1, "", "tuple_concat"]]}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "property", "Python property"], "4": ["py", "method", "Python method"], "5": ["py", "function", "Python function"]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:attribute", "3": "py:property", "4": "py:method", "5": "py:function"}, "terms": {"": [2, 3, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 38, 41, 42, 43, 44, 49], "0": [14, 15, 17, 19, 20, 21, 22, 23, 24, 30, 32, 36, 37, 39, 40, 41, 42, 43, 44, 45, 47], "06": [32, 40], "1": [14, 15, 17, 19, 21, 22, 23, 24, 30, 39, 42, 43, 44, 45, 49], "10": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "100": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "1000000": [10, 11, 14, 15, 17, 19, 21, 23, 32, 40, 41, 42, 43, 44], "1e": [32, 40], "2": [14, 15, 17, 19, 21, 22, 23, 32, 39, 40, 42, 43, 44, 49], "20": [22, 44], "24": [32, 40], "3": [14, 15, 17, 19, 21, 23, 42, 43, 44], "31": [32, 40], "4": [14, 15, 17, 19, 21, 23, 42, 43, 44], "5": [14, 15, 17, 19, 21, 23, 42, 43, 44], "512": 
[16, 18, 22, 42, 43, 44], "6": [17, 19, 20, 21, 23, 41, 43, 44], "64": [16, 18, 22, 42, 43, 44], "64bit": [32, 40], "7": [17, 19, 21, 23, 43, 44], "8": [17, 19, 43], "A": [13, 16, 18, 22, 24, 26, 28, 29, 31, 32, 40, 41, 42, 43, 44, 45, 52], "As": [17, 19, 24, 25, 43, 45], "If": [2, 4, 5, 20, 32, 38, 39, 40, 41], "In": [2, 4, 5, 38, 39], "It": [7, 8, 39], "Not": [10, 14, 15, 21, 23, 41, 42, 44], "The": [6, 10, 11, 16, 18, 20, 22, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 52], "These": [24, 25, 45], "To": [32, 40], "With": [2, 4, 5, 38, 39], "_": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44, 45], "__call__": [7, 8, 16, 18, 22, 38, 39, 41, 42, 43, 44], "__init__": [16, 18, 22, 42, 43, 44], "__lt__": [7, 38, 39], "__new__": [7, 8, 38, 39], "__setattr__": [16, 18, 22, 42, 43, 44], "_description_": [2, 4, 5, 10, 21, 23, 24, 25, 30, 36, 37, 38, 39, 41, 44, 45, 47], "_imag": [32, 40], "_sentinel": [16, 18, 22, 42, 43, 44], "_summary_": [10, 21, 23, 41, 44], "_type_": [36, 37, 47], "abc": [7, 8, 10, 11, 24, 25, 39, 41, 45], "abstract": [7, 8, 10, 11, 24, 25, 39, 41, 45], "access": [16, 18, 22, 42, 43, 44], "accumul": [32, 40], "acm": [32, 40], "across": [17, 19, 43], "act": [20, 41], "action": [2, 4, 5, 10, 11, 13, 14, 15, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46], "action_dim": [16, 18, 22, 41, 42, 43, 44], "action_s": [10, 11, 41], "action_spac": [2, 4, 5, 24, 25, 26, 27, 28, 29, 31, 38, 39, 40, 45, 55], "action_typ": [10, 11, 40, 41], "activ": [16, 18, 22, 41, 42, 43, 44], "actor": [10, 18, 21, 22, 23, 41, 43, 44, 52], "actor_grad": [21, 23, 41, 44], "actor_loss": [10, 21, 23, 41, 44], "actor_network_param": [10, 21, 23, 41, 44], "actor_opt_st": [10, 21, 23, 41, 44], "actor_train_st": [10, 21, 23, 41, 44], "actual": [24, 25, 45], "ad": [20, 41], "adapt": [10, 11, 12, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "add": [20, 41], "add_batch": [20, 41], "add_sequ": [20, 41], "addit": [2, 
4, 5, 38, 39], "advantag": [7, 8, 17, 19, 39, 41, 43], "after": [32, 40], "agent": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "algorithm": [2, 4, 5, 6, 24, 25, 36, 37, 38, 39, 40, 45, 47, 52, 55], "algorithm_kw_arg": [6, 39], "algorithm_st": [6, 10, 11, 39, 41], "algorithmst": [6, 39], "alia": [14, 15, 17, 19, 21, 23, 42, 43, 44], "all": [6, 10, 11, 14, 15, 17, 19, 21, 23, 32, 39, 40, 41, 42, 43, 44], "allow": [7, 8, 39], "alpha": [10, 20, 21, 22, 23, 41, 44], "alpha_init": [22, 41, 44], "alpha_loss": [10, 21, 23, 41, 44], "alpha_network_param": [10, 21, 23, 41, 44], "alpha_opt_st": [10, 21, 23, 41, 44], "alpha_train_st": [10, 21, 23, 41, 44], "alphacoef": [22, 41, 44], "alwai": [17, 19, 43], "among": [10, 11, 41], "an": [6, 7, 8, 13, 16, 18, 20, 22, 24, 25, 27, 32, 39, 40, 41, 42, 43, 44, 45, 49, 52], "ani": [6, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 30, 32, 33, 34, 39, 40, 41, 42, 43, 44, 45, 46], "anoth": [16, 18, 22, 42, 43, 44, 49], "answer": 51, "append": [6, 39], "appli": [16, 18, 22, 42, 43, 44, 52], "apply_fn": [15, 19, 23, 42, 43, 44], "approxim": 52, "ar": [6, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 32, 33, 34, 39, 40, 41, 42, 43, 44, 46], "architectur": [10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 41, 42, 43, 44, 47], "arg": [7, 8, 22, 39, 44], "argument": [24, 30, 45], "around": [7, 8, 39], "arrai": [2, 4, 5, 14, 15, 17, 19, 21, 22, 23, 24, 25, 27, 32, 38, 39, 40, 41, 42, 43, 44, 45], "assign": [16, 18, 22, 42, 43, 44], "attribut": [6, 16, 18, 22, 39, 42, 43, 44], "autom": [2, 4, 5, 38, 39, 52], "automl": [49, 52], "autorl": [2, 38, 52, 55], "autorl_config": [6, 39], "autorl_env": [38, 40, 55], "autorlenv": [2, 4, 5, 38, 39, 55], "axi": [32, 36, 37, 40, 47], "base": [2, 4, 5, 6, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 44, 45, 46], "baselines3": [18, 22, 43, 44], "basic": [7, 8, 10, 11, 39, 41], "batch": [10, 12, 14, 15, 20, 21, 23, 
32, 40, 41, 42, 44], "batch_siz": [12, 41], "bayesian": 52, "befor": [2, 4, 5, 16, 18, 22, 32, 38, 39, 40, 42, 43, 44], "behaviour": [7, 8, 39], "being": [16, 18, 20, 22, 41, 42, 43, 44], "best": 52, "between": [7, 12, 39, 41], "black": 52, "blob": [18, 22, 32, 40, 43, 44], "bo": [49, 52], "bool": [2, 4, 5, 6, 7, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 32, 38, 39, 40, 41, 42, 43, 44, 45], "bool_": [17, 19, 21, 23, 41, 43, 44, 45], "both": [24, 25, 45], "bound": [16, 18, 22, 42, 43, 44], "box": [33, 34, 46, 52], "brax": [24, 26, 30, 45], "brax_env": [38, 40], "braxenv": [24, 26, 40, 45], "buffer": [6, 10, 11, 14, 15, 17, 19, 20, 38, 39, 40, 42, 43], "buffer_dir": [6, 39], "buffer_st": [6, 10, 11, 14, 15, 17, 19, 21, 23, 39, 41, 42, 43, 44], "c_episod": [6, 39], "c_step": [6, 39], "calcul": [7, 8, 22, 39, 44], "call": [2, 4, 5, 7, 8, 16, 18, 20, 22, 33, 34, 38, 39, 41, 42, 43, 44, 46], "callabl": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "can": [7, 8, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 39, 41, 42, 43, 44, 52], "captur": [13, 41], "carbon": [7, 39], "case": [16, 18, 22, 42, 43, 44], "caus": [16, 18, 22, 42, 43, 44], "certain": [6, 39], "cfg": [2, 3, 38], "checkpoint": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 41, 42, 43, 44, 55], "checkpoint_dir": [6, 39], "checkpoint_nam": [6, 39], "checkpoint_path": [2, 4, 5, 6, 38, 39], "chex": [10, 11, 12, 14, 15, 17, 19, 21, 23, 33, 34, 41, 42, 43, 44, 46], "chosen": [20, 41], "cl": [7, 8, 39], "class": [2, 4, 5, 6, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 44, 45, 46], "classmethod": [42, 43, 44], "clip": 52, "cnn": [16, 18, 22, 42, 43, 44], "cnn_polici": [10, 14, 15, 17, 19, 21, 23, 24, 30, 31, 41, 42, 43, 44, 45], "cnnactorcrit": [18, 41, 43], "cnnq": [16, 41, 42], "code": [7, 39, 49], "coeffici": [22, 44], "com": [18, 22, 32, 40, 43, 44], "common": [6, 18, 22, 38, 39, 40, 43, 44, 55], "common_gotchas_in_jax": [32, 40], 
"compact": [16, 18, 22, 42, 43, 44], "compar": [7, 39], "comparison": [7, 39], "compat": [24, 30, 45], "comput": [32, 40], "concat": [36, 37, 47], "concaten": [36, 37, 47], "config": [2, 3, 4, 5, 38, 39, 55], "config_kei": [36, 37, 47], "config_spac": [2, 4, 5, 36, 37, 38, 39, 47, 55], "config_space_to_gymnasium_spac": [36, 37, 38, 47], "config_space_to_yaml": [36, 37, 38, 47], "configspac": [2, 4, 5, 36, 37, 38, 39, 47], "configur": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 38, 39, 41, 42, 43, 44, 47], "configurationspac": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 38, 39, 41, 42, 43, 44, 47], "consid": [32, 40], "consist": [14, 15, 17, 19, 21, 23, 42, 43, 44], "construct": [0, 16, 18, 22, 42, 43, 44, 48, 51, 54], "contain": [6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 32, 39, 40, 41, 42, 43, 44, 45], "content": 55, "conv": [16, 18, 22, 42, 43, 44], "conv1": [16, 18, 22, 42, 43, 44], "converst": [36, 37, 47], "convert": [27, 36, 37, 45, 47], "core": [38, 39, 55], "correspond": [32, 40], "count": [32, 38, 40], "cpu": [20, 41], "creat": [2, 4, 5, 7, 8, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 38, 39, 41, 42, 43, 44, 45], "create_prioritised_item_buff": [20, 40, 41], "create_with_opt_st": [41, 42, 43, 44], "critic": [10, 18, 21, 22, 23, 41, 43, 44, 52], "critic_grad": [21, 23, 41, 44], "critic_loss": [10, 21, 23, 41, 44], "critic_network_param": [10, 21, 23, 41, 44], "critic_opt_st": [10, 21, 23, 41, 44], "critic_target_param": [10, 21, 23, 41, 44], "critic_train_st": [10, 21, 23, 41, 44], "cumul": [10, 11, 41], "cur_reward": [17, 19, 41, 43], "current": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "d": [13, 41], "data": [6, 20, 32, 39, 40, 41], "deep": [10, 14, 15, 41, 42, 52], "deepmind": [32, 40], "def": [16, 18, 22, 42, 43, 44], "default": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 32, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47], "defin": [10, 11, 16, 18, 22, 41, 42, 43, 44], "degrad": [32, 40], 
"denorm": [32, 38, 40], "depend": [20, 32, 40, 41], "determinist": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "deterministic_ev": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "deviat": [7, 32, 39, 40], "devic": [20, 41], "dict": [2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 24, 30, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47], "dict1": [36, 37, 47], "dict2": [36, 37, 47], "dictionari": [6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 39, 41, 42, 43, 44, 47], "differ": [10, 11, 41, 52], "dimens": [32, 40], "directli": [7, 8, 39], "directori": [6, 39], "discret": [10, 11, 16, 18, 41, 42, 43], "disk": [6, 39], "distrax": [22, 44], "distribut": [22, 44], "dlr": [18, 22, 43, 44], "do": [7, 8, 39], "doc": [32, 40], "doe": [16, 17, 18, 19, 22, 42, 43, 44], "doesn": [32, 40], "dolor": 53, "done": [6, 7, 8, 10, 13, 14, 15, 19, 23, 39, 40, 41, 42, 43, 44, 52], "doubl": [32, 40], "dqn": [10, 21, 23, 38, 39, 40, 41, 44, 52], "dqnmetric": [14, 15, 41, 42], "dqnrunnerst": [10, 14, 15, 41, 42], "dqnstate": [10, 14, 15, 41, 42], "dqntrainingresult": [10, 14, 15, 41, 42], "dqntrainreturnt": [10, 14, 15, 41, 42], "dqntrainstat": [10, 14, 15, 41, 42], "dtype": [32, 40], "dummi": [6, 39], "dummy_buffer_st": [6, 39], "dure": [2, 4, 5, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "dynam": [32, 40], "each": [2, 4, 5, 20, 24, 25, 38, 39, 41, 45], "earlier": [32, 40], "either": [16, 18, 22, 42, 43, 44], "element": [32, 36, 37, 40, 47], "emiss": [7, 38, 39], "empti": [2, 4, 5, 38, 39], "en": [32, 40], "enabl": [32, 40], "entropi": [10, 21, 23, 41, 44, 52], "env": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 35, 38, 39, 41, 42, 43, 44, 45, 46], "env_framework": [24, 30, 45], "env_kwarg": [24, 26, 27, 28, 29, 30, 31, 45], "env_nam": [24, 25, 26, 27, 28, 29, 30, 31, 40, 45], "env_stat": [14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "environ": [2, 4, 5, 6, 7, 8, 10, 11, 13, 33, 34, 38, 39, 40, 41, 46, 52], "envpool": 
[24, 27, 30, 45], "envpool_env": [38, 40], "envpoolenv": [24, 27, 40, 45], "episod": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "equival": [20, 24, 30, 32, 40, 41, 45], "error": [2, 4, 5, 38, 39], "etc": [24, 30, 32, 40, 45], "eval": [2, 4, 5, 10, 11, 38, 39, 40, 41, 55], "eval_env": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "eval_reward": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "evalu": [2, 4, 5, 7, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "evalut": [2, 4, 5, 38, 39], "even": [32, 40], "experi": [10, 12, 21, 23, 41, 44], "exploit": 52, "explor": 52, "expon": [20, 41], "extract": [36, 37, 47], "factori": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "fals": [10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 31, 41, 42, 43, 44, 45], "featur": [2, 4, 5, 8, 38, 39], "fidel": 52, "field": [14, 15, 17, 19, 21, 23, 32, 40, 42, 43, 44], "file": [32, 36, 37, 40, 47], "final": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "find": 52, "first": [7, 8, 36, 37, 39, 47, 51], "fit": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "flatten": [33, 34, 46], "flatten_observ": [38, 40], "flattenobservationwrapp": [33, 34, 40, 46], "flax": [16, 18, 22, 42, 43, 44], "float": [2, 3, 20, 32, 38, 40, 41, 44], "float32": [32, 40], "follow": [16, 18, 22, 24, 25, 30, 42, 43, 44, 45], "framework": [24, 30, 45], "from": [6, 32, 39, 40, 52], "from_tupl": [40, 41], "frozendict": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "full": [32, 40], "fulli": [24, 25, 45], "function": [3, 7, 8, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 32, 33, 34, 37, 39, 40, 41, 42, 43, 44, 45, 46, 52], "gener": [10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "get_checkpoint_factori": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_default_hpo_config": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_default_nas_config": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], 
"get_hpo_config_spac": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_hpo_search_spac": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_nas_config_spac": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_spec": [7, 38, 39], "get_state_spac": [8, 38, 39], "github": [18, 22, 32, 40, 43, 44], "give": [16, 18, 22, 42, 43, 44], "given": [2, 3, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 32, 33, 34, 38, 40, 41, 42, 43, 44, 45, 46, 52], "global_step": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "glossari": 49, "gpu": [20, 41], "grad": [8, 10, 14, 15, 17, 19, 39, 41, 42, 43], "grad_info": 39, "gradient": [8, 39, 52], "gradinfo": [8, 38, 39], "gymnasium": [2, 4, 5, 24, 25, 28, 30, 36, 37, 38, 39, 45, 47], "gymnasium_env": [38, 40], "gymnasium_space_to_gymnax_spac": [36, 37, 38, 47], "gymnasiumenv": [24, 28, 40, 45], "gymnax": [24, 25, 26, 27, 28, 29, 30, 31, 36, 37, 45, 47], "gymnax_env": [38, 40], "gymnax_spac": [36, 37, 47], "gymnaxenv": [24, 29, 40, 45], "gynasium": [2, 4, 5, 38, 39], "gynmasium": [2, 4, 5, 38, 39], "ha": [24, 30, 45], "happen": [16, 18, 22, 42, 43, 44], "have": [32, 40], "hello": 49, "here": [16, 18, 22, 42, 43, 44, 49, 51], "hidden_s": [16, 18, 22, 41, 42, 43, 44], "hierarchi": [32, 40], "howev": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "hp_config": [6, 36, 37, 39, 47], "hp_config_spac": [36, 37, 47], "hpo": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44, 52], "hpo_config": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44, 55], "html": [32, 40], "http": [18, 22, 32, 40, 43, 44, 49], "hyperparamet": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 38, 39, 41, 42, 43, 44, 47, 52], "i": [0, 2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 38, 39, 41, 42, 43, 44, 48, 49, 51, 54], "id": [6, 24, 25, 30, 39, 45], "identifi": [6, 39], "imit": [7, 8, 39], "immedi": [16, 18, 22, 42, 43, 44], "impact": [32, 40], "implement": [7, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 39, 41, 42, 
43, 44, 45], "improv": [32, 40, 52], "includ": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "independ": [20, 41], "inexact": [32, 40], "info": [15, 19, 23, 41, 42, 43, 44], "inform": [2, 4, 5, 8, 38, 39], "infot": [2, 4, 5, 38, 39], "init": [10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 40, 41, 42, 43, 44], "init_and_output": [16, 18, 22, 42, 43, 44], "init_st": [32, 38, 40], "initi": [2, 4, 5, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 32, 38, 39, 40, 41, 42, 43, 44], "insid": [16, 18, 22, 42, 43, 44], "instal": 49, "instanc": [7, 8, 16, 18, 22, 39, 42, 43, 44], "int": [2, 4, 5, 6, 10, 11, 12, 14, 15, 17, 19, 20, 21, 23, 24, 25, 30, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47], "int32": [32, 40], "integ": [32, 40], "interact": [13, 41], "intern": [24, 25, 33, 34, 45, 46], "interv": [12, 41], "invok": [16, 18, 22, 42, 43, 44], "io": [32, 40], "ipsum": 53, "is_weight": [10, 14, 15, 21, 23, 41, 42, 44], "item": [13, 20, 40, 41, 49], "iter": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "its": [2, 4, 5, 33, 34, 38, 39, 46, 52], "jax": [10, 14, 15, 17, 19, 21, 23, 24, 25, 27, 30, 32, 40, 41, 42, 43, 44, 45], "jax_enable_x64": [32, 40], "jit": [32, 40], "jittabl": [24, 25, 45], "jnp": [10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 32, 33, 34, 40, 41, 42, 43, 44, 45, 46], "json": 39, "keep": [7, 8, 39], "kei": [10, 11, 12, 13, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "kept": [17, 19, 43], "keyword": [24, 30, 45], "kind": [24, 25, 45], "know": [6, 39], "kwarg": [7, 8, 22, 39, 41, 42, 43, 44], "l48": [18, 22, 43, 44], "larg": [32, 40], "last": [6, 7, 39], "last_ob": [13, 40, 41], "latest": [32, 40], "lazi": [16, 18, 22, 42, 43, 44], "lazili": [16, 18, 22, 42, 43, 44], "learn": [2, 4, 5, 10, 11, 38, 39, 41, 52], "leav": [32, 40], "length": [12, 20, 41], "less": [7, 39], "let": 49, "level": [2, 38, 52], "like": [2, 4, 5, 13, 16, 18, 22, 38, 39, 41, 42, 43, 44], "line": [16, 18, 22, 42, 43, 44], "linen": [16, 18, 
22, 42, 43, 44], "link": 49, "list": [2, 3, 4, 5, 38, 39, 49], "load": [6, 38, 39], "load_buff": [6, 38, 39], "log_prob": [19, 41, 43], "log_std_max": [22, 41, 44], "log_std_min": [22, 41, 44], "logger": [2, 3, 38], "lorem": 53, "loss": [10, 14, 15, 17, 19, 41, 42, 43], "machin": 52, "make": [20, 41], "make_env": [24, 38, 40], "make_prioritised_item_buff": [20, 40, 41], "map": [13, 41], "master": [18, 22, 32, 40, 43, 44], "match": [24, 30, 32, 40, 45], "max_abs_valu": [32, 40], "max_length": [20, 41], "max_recorded_prior": 39, "maxim": [7, 39], "maximum": [20, 32, 40, 41, 52], "mean": [7, 32, 38, 39, 40], "mean_std": [32, 40], "measur": [7, 39], "method": [6, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 39, 41, 42, 43, 44, 45, 52], "metric": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "min_length": [20, 41], "minim": [7, 39], "minimum": [20, 32, 40, 41, 52], "mlp": [16, 18, 22, 42, 43, 44], "mlpactorcrit": [18, 41, 43], "mlpq": [16, 41, 42], "mode": [22, 41, 44, 49], "model": [40, 41, 52], "modifi": [32, 40], "modul": [2, 4, 9, 10, 14, 16, 17, 18, 21, 22, 24, 33, 36, 55], "more": [20, 41], "mrp_file": [38, 39], "multi": 52, "multipl": 52, "must": [24, 30, 32, 40, 45], "mymodul": [16, 18, 22, 42, 43, 44], "n_critic": [22, 41, 44], "n_env": [10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 26, 27, 29, 30, 31, 40, 41, 42, 43, 44, 45], "n_eval_episod": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "n_eval_step": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "n_total_timestep": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "name": [6, 16, 18, 22, 24, 25, 30, 32, 36, 37, 39, 40, 41, 42, 43, 44, 45, 47], "namedtupl": [14, 15, 17, 19, 21, 23, 42, 43, 44], "nas_config": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "nas_config_sapc": [36, 37, 47], "naturecnn": [18, 22, 43, 44], "ndarrai": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46], "need": [24, 25, 45], 
"nest": [32, 40], "nestedmeanstd": [32, 38, 40], "network": [10, 14, 15, 16, 17, 18, 19, 21, 22, 23, 41, 42, 43, 44, 52], "network_param": [10, 14, 15, 17, 19, 41, 42, 43], "network_st": [41, 44], "neural": [10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 41, 42, 43, 44, 47, 52], "new": [7, 8, 15, 19, 23, 32, 39, 40, 42, 43, 44], "next": [10, 14, 15, 41, 42], "next_observ": [10, 14, 15, 41, 42], "nn": [16, 18, 22, 42, 43, 44], "node": 39, "nodes_fil": [38, 39], "none": [2, 3, 4, 5, 6, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47], "norm": [8, 39], "normal": [32, 38, 40], "normalizer_st": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "note": [17, 19, 24, 25, 32, 40, 43, 45, 49], "notebook": [32, 40], "now": [16, 18, 22, 42, 43, 44], "np": [2, 4, 5, 38, 39], "npy": 39, "num_eval_episod": [2, 4, 5, 10, 11, 38, 39, 41], "number": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 30, 33, 34, 38, 39, 41, 42, 43, 44, 45, 46], "numpi": [27, 32, 40, 45], "numpy_to_jax": [27, 40, 45], "ob": [10, 11, 13, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "object": [2, 3, 4, 5, 6, 8, 13, 15, 16, 18, 19, 22, 23, 32, 33, 35, 36, 37, 38, 40, 41, 42, 43, 44, 46, 47, 52, 55], "objectivest": [2, 4, 5, 38, 39], "objectv": [7, 39], "obser": [33, 34, 46], "observ": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 41, 42, 43, 44, 45, 46], "observation_spac": [2, 4, 5, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 40, 45, 46, 55], "observationt": [2, 4, 5, 38, 39], "off": 52, "onc": [16, 18, 22, 42, 43, 44], "one": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 30, 38, 39, 41, 42, 43, 44, 45], "onli": [17, 19, 32, 40, 43], "oper": [20, 41], "opt_stat": [10, 14, 15, 17, 19, 23, 41, 42, 43, 44], "optax": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "optim": [7, 10, 14, 15, 17, 19, 20, 21, 23, 39, 41, 42, 43, 44, 52], "optimize_object": [7, 39], "option": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 
20, 21, 23, 24, 30, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47], "optstat": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "order": 49, "org": [32, 40, 49], "other": [7, 10, 14, 15, 16, 17, 18, 19, 21, 22, 23, 39, 41, 42, 43, 44], "output": 49, "overflow": [32, 40], "overrid": [7, 8, 39], "overriden": [6, 39], "packag": [2, 55], "page": [0, 48, 49, 51, 54], "paper": [20, 41], "param": [10, 14, 15, 17, 19, 23, 41, 42, 43, 44], "paramet": [2, 4, 5, 6, 7, 8, 10, 11, 12, 14, 15, 17, 19, 20, 21, 23, 24, 25, 30, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "parent": [16, 18, 22, 41, 42, 43, 44], "part": [6, 39], "pass": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 30, 32, 38, 39, 40, 41, 42, 43, 44, 45], "path": [2, 4, 5, 6, 38, 39], "per": [2, 4, 5, 10, 11, 14, 15, 17, 19, 20, 21, 23, 38, 39, 41, 42, 43, 44], "perform": [2, 4, 5, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 25, 32, 38, 39, 40, 41, 42, 43, 44, 45], "period": [12, 41], "pmap": [32, 40], "pmap_axis_nam": [32, 40], "png": [32, 40], "point": [32, 40], "polici": [10, 17, 19, 41, 43, 52], "possibl": [10, 11, 41], "possibli": [32, 40], "posssibl": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "ppo": [10, 21, 22, 23, 38, 39, 40, 41, 44, 52], "ppometr": [17, 19, 41, 43], "pporunnerst": [10, 17, 19, 41, 43], "ppostat": [10, 17, 19, 41, 43], "ppotrainingresult": [10, 17, 19, 41, 43], "ppotrainreturnt": [10, 17, 19, 41, 43], "ppotrainst": [17, 19, 41, 43], "precis": [32, 40], "predefin": 52, "predict": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "principl": 52, "print": 49, "prioriti": [6, 20, 39, 41], "prioritis": [20, 41], "prioritised_item_buff": [38, 40], "prioritisedtrajectorybuff": [20, 41], "prioritisedtrajectorybufferst": [6, 10, 12, 14, 15, 21, 23, 39, 41, 42, 44], "priority_expon": [20, 41], "priority_state_path": [6, 39], "prioriz": [12, 41], "prngkei": [10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "problem": 52, "process": 52, "product": 49, 
"properti": [2, 4, 5, 10, 11, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 41, 45, 46], "provid": [13, 41], "proxim": [10, 17, 19, 41, 43, 52], "py": [18, 22, 32, 40, 43, 44], "q": [10, 14, 15, 16, 41, 42, 52], "rais": [2, 4, 5, 38, 39], "random": [2, 4, 5, 10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 30, 33, 34, 38, 39, 41, 42, 43, 44, 45, 46, 52], "randomli": 52, "rang": [32, 40], "rank": [7, 38, 39], "re": [2, 4, 5, 38, 39], "readthedoc": [32, 40], "real": 52, "recurs": [36, 37, 47], "recursive_concat": [36, 37, 38, 47], "refer": 49, "reinforc": [2, 4, 5, 10, 11, 38, 39, 41, 52], "relat": [6, 39], "remov": 49, "replac": [15, 19, 23, 32, 38, 40, 41, 42, 43, 44], "requir": [6, 39], "reset": [2, 4, 5, 24, 25, 33, 34, 38, 39, 40, 45, 46, 55], "restor": [6, 39], "result": [6, 10, 11, 14, 15, 17, 19, 21, 23, 32, 33, 34, 39, 40, 41, 42, 43, 44, 46], "return": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 14, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "return_buff": [17, 19, 41, 43], "return_buffer_idx": [17, 19, 41, 43], "reward": [7, 10, 11, 13, 14, 15, 19, 23, 39, 40, 41, 42, 43, 44], "reward_mean": 39, "reward_std": 39, "rewardmean": [7, 38, 39], "rewardstd": [7, 38, 39], "rl": [2, 4, 5, 24, 25, 26, 27, 28, 29, 30, 31, 38, 39, 45], "rm": [18, 22, 43, 44], "rng": [10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "rng_kei": [12, 41], "run": [2, 3, 4, 5, 32, 38, 39, 40], "run_arlbench": [2, 3, 38, 55], "runner": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "runner_st": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "running_statist": [38, 55], "runningstatisticsst": [14, 15, 17, 19, 21, 23, 32, 38, 40, 42, 43, 44], "runtim": [7, 38, 39], "sac": [10, 38, 39, 40, 41, 52], "saccnnactor": [22, 41, 44], "saccnncrit": [22, 41, 44], "sacmetr": [21, 23, 41, 44], "sacmlpactor": [22, 41, 44], "sacmlpcrit": [22, 41, 44], "sacrunnerst": [10, 21, 23, 41, 44], "sacstat": [10, 21, 23, 41, 
44], "sactrainingresult": [10, 21, 23, 41, 44], "sactrainreturnt": [10, 21, 23, 41, 44], "sactrainst": [10, 21, 23, 41, 44], "sacvectorcrit": [22, 41, 44], "safe": [16, 18, 22, 42, 43, 44], "same": [32, 36, 37, 40, 47], "sampl": [10, 11, 12, 14, 15, 17, 19, 20, 21, 23, 24, 25, 41, 42, 43, 44, 45, 52], "sample_act": [24, 25, 40, 45], "sample_batch_s": [20, 41], "save": [6, 38, 39], "save_buff": [6, 38, 39], "save_defaults_to_yaml": [36, 37, 38, 47], "scalar": 39, "scalars_fil": [38, 39], "scope": [41, 42, 43, 44], "search": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44, 52], "second": [36, 37, 47], "see": [16, 18, 22, 32, 40, 42, 43, 44], "seed": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 27, 28, 30, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47], "self": [7, 8, 16, 18, 22, 39, 42, 43, 44], "sequenc": [12, 20, 41], "sequence_length": [12, 41], "set": [13, 32, 40, 41], "setup": [16, 18, 22, 41, 42, 43, 44], "shape": [10, 11, 32, 40, 41], "share": [10, 11, 41], "should": [32, 40], "similar": [16, 18, 22, 42, 43, 44], "simplifi": [32, 40], "singl": [6, 20, 39, 41], "size": [6, 10, 11, 12, 20, 39, 41], "soft": [10, 21, 23, 41, 44, 52], "some": 49, "sort": [7, 39], "sourc": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "space": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 52], "specif": [7, 8, 39], "specifi": [15, 19, 23, 32, 40, 42, 43, 44], "stabil": 52, "stabl": [18, 22, 32, 40, 43, 44], "stable_baselines3": [18, 22, 43, 44], "standard": [7, 32, 39, 40], "state": [2, 4, 5, 6, 8, 10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46], "state_featur": [38, 55], "statefeatur": [8, 38, 39], "static": [6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 39, 41, 42, 43, 44], "statist": [32, 40], "std": [32, 38, 40], "std_max_valu": [32, 40], 
"std_min_valu": [32, 40], "step": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46, 49, 55], "store": [6, 7, 8, 39], "str": [2, 4, 5, 6, 7, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 25, 30, 32, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47], "string": [36, 37, 47], "structur": [32, 40], "sub": [24, 25, 45], "submodul": [16, 18, 22, 55], "subpackag": 55, "subsequ": [7, 8, 39], "summed_vari": [32, 38, 40], "support": [12, 24, 25, 41, 45], "surrog": 52, "t": [32, 40], "tag": [6, 39], "take": [24, 25, 33, 34, 45, 46], "taken": [32, 40], "tanh": [16, 18, 22, 42, 43, 44], "tanhtransformeddistribut": [22, 41, 44], "target": [10, 14, 15, 21, 23, 41, 42, 44], "target_param": [10, 14, 15, 23, 41, 42, 44], "td_error": [10, 14, 15, 21, 23, 41, 42, 44], "term": 49, "termin": [2, 4, 5, 38, 39], "than": [7, 39], "thi": [0, 2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 32, 38, 39, 40, 41, 42, 43, 44, 48, 49, 51, 52, 54], "three": [16, 18, 22, 42, 43, 44], "time": [20, 41], "timestep": [10, 11, 13, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "to_tupl": [40, 41], "top": [2, 38], "torch_lay": [18, 22, 43, 44], "total": [2, 4, 5, 7, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "tpu": [20, 41], "track_metr": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "track_trajectori": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "train": [2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 40, 41, 42, 43, 44], "train_func": [7, 8, 39], "train_result": [6, 10, 11, 14, 15, 17, 19, 21, 23, 39, 41, 42, 43, 44], "train_stat": [10, 14, 15, 17, 19, 41, 42, 43], "trainfunc": [7, 8, 39], "training_result": [10, 11, 41], "trainresult": [6, 39], "trainstat": [15, 19, 23, 42, 43, 44], "trajectori": [10, 12, 14, 15, 17, 19, 20, 21, 23, 41, 42, 43, 44], "trajectorybufferst": [6, 39], "transform": [22, 44], "transit": [10, 14, 15, 17, 19, 20, 21, 23, 41, 42, 43, 44], "transitionsampl": [12, 41], "true": [10, 11, 14, 15, 16, 17, 
18, 19, 21, 23, 32, 40, 41, 42, 43, 44], "truncat": [2, 4, 5, 38, 39], "tupl": [2, 3, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47], "tuple1": [36, 37, 47], "tuple2": [36, 37, 47], "tuple_concat": [36, 37, 38, 47], "twice": [32, 40], "two": [7, 36, 37, 39, 47], "tx": [15, 19, 23, 42, 43, 44], "type": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 14, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "u": [7, 8, 39], "under": [0, 48, 51, 54], "uniform": [12, 41], "uniform_sampl": [12, 40, 41], "union": [17, 19, 21, 23, 41, 42, 43, 44, 45], "uniqu": [6, 39], "unus": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "updat": [10, 11, 14, 15, 17, 19, 21, 23, 32, 38, 40, 41, 42, 43, 44], "update_actor": [10, 21, 23, 40, 41, 44], "update_alpha": [10, 21, 23, 40, 41, 44], "update_crit": [10, 21, 23, 40, 41, 44], "update_hpo_config": [10, 11, 40, 41], "us": [2, 3, 4, 5, 7, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 32, 38, 39, 40, 41, 42, 43, 44, 45, 52], "util": [32, 38, 40, 55], "valid": [32, 40], "validate_shap": [32, 40], "valu": [13, 15, 19, 23, 32, 36, 37, 40, 41, 42, 43, 44, 47], "valueerror": [2, 4, 5, 38, 39], "varianc": [32, 40], "variou": [24, 25, 45], "vault": [6, 39], "vault_uuid": [6, 39], "view": [13, 41], "wa": [2, 4, 5, 6, 32, 38, 39, 40], "we": [7, 8, 39], "weigh": 52, "weight": [32, 40], "well": [6, 24, 25, 39, 45], "when": [16, 18, 22, 32, 40, 42, 43, 44], "where": [6, 39], "whether": [6, 7, 10, 11, 20, 39, 41], "which": [6, 16, 18, 22, 39, 42, 43, 44], "while": [7, 8, 39], "wise": [36, 37, 47], "work": [16, 18, 22, 42, 43, 44], "world": [49, 52], "wrap": [7, 8, 16, 18, 22, 33, 34, 39, 42, 43, 44, 46], "wrapper": [24, 30, 38, 40, 45], "write": [36, 37, 47, 49], "x": [16, 18, 22, 27, 42, 43, 44, 45], "xland": [24, 30, 31, 45], "xland_env": [38, 40], "xlandenv": [31, 40, 45], "yaml": [36, 37, 47], "yet": [16, 18, 22, 42, 43, 44], "your": [49, 
51]}, "titles": ["Advanced Usage", "API References", "arlbench", "arlbench.arlbench", "arlbench.autorl", "arlbench.autorl.autorl_env", "arlbench.autorl.checkpointing", "arlbench.autorl.objectives", "arlbench.autorl.state_features", "arlbench.core", "arlbench.core.algorithms", "arlbench.core.algorithms.algorithm", "arlbench.core.algorithms.buffers", "arlbench.core.algorithms.common", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.dqn.dqn", "arlbench.core.algorithms.dqn.models", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.ppo.models", "arlbench.core.algorithms.ppo.ppo", "arlbench.core.algorithms.prioritised_item_buffer", "arlbench.core.algorithms.sac", "arlbench.core.algorithms.sac.models", "arlbench.core.algorithms.sac.sac", "arlbench.core.environments", "arlbench.core.environments.autorl_env", "arlbench.core.environments.brax_env", "arlbench.core.environments.envpool_env", "arlbench.core.environments.gymnasium_env", "arlbench.core.environments.gymnax_env", "arlbench.core.environments.make_env", "arlbench.core.environments.xland_env", "arlbench.core.running_statistics", "arlbench.core.wrappers", "arlbench.core.wrappers.flatten_observation", "arlbench.core.wrappers.wrapper", "arlbench.utils", "arlbench.utils.common", "arlbench package", "arlbench.autorl package", "arlbench.core package", "arlbench.core.algorithms package", "arlbench.core.algorithms.dqn package", "arlbench.core.algorithms.ppo package", "arlbench.core.algorithms.sac package", "arlbench.core.environments package", "arlbench.core.wrappers package", "arlbench.utils package", "Basic Usage", "Helpful Commands", "&lt;no title&gt;", "Frequently Asked Questions", "Glossary", "Home", "Installation", "arlbench"], "titleterms": {"advanc": 0, "algorithm": [10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 41, 42, 43, 44], "api": 1, "arlbench": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 
39, 40, 41, 42, 43, 44, 45, 46, 47, 55], "ask": 51, "autorl": [4, 5, 6, 7, 8, 39], "autorl_env": [5, 25, 39, 45], "basic": 48, "brax_env": [26, 45], "buffer": [12, 41], "checkpoint": [6, 39], "command": 49, "common": [13, 37, 41, 47], "content": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "core": [9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 40, 41, 42, 43, 44, 45, 46], "dqn": [14, 15, 16, 42], "environ": [24, 25, 26, 27, 28, 29, 30, 31, 45], "envpool_env": [27, 45], "flatten_observ": [34, 46], "frequent": 51, "glossari": 52, "gymnasium_env": [28, 45], "gymnax_env": [29, 45], "help": 49, "home": 53, "instal": 54, "make_env": [30, 45], "model": [16, 18, 22, 42, 43, 44], "modul": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "object": [7, 39], "packag": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "ppo": [17, 18, 19, 43], "prioritised_item_buff": [20, 41], "question": 51, "refer": 1, "running_statist": [32, 40], "sac": [21, 22, 23, 44], "state_featur": [8, 39], "submodul": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "subpackag": [38, 40, 41], "usag": [0, 48], "util": [36, 37, 47], "wrapper": [33, 34, 35, 46], "xland_env": [31, 45]}})
\ No newline at end of file
+Search.setIndex({"alltitles": {"API References": [[1, "api-references"]], "Advanced Usage": [[0, "advanced-usage"]], "Basic Usage": [[48, "basic-usage"]], "Frequently Asked Questions": [[51, "frequently-asked-questions"]], "Glossary": [[52, "glossary"]], "Helpful Commands": [[49, "helpful-commands"]], "Home": [[53, "home"]], "Installation": [[54, "installation"]], "Module contents": [[38, "module-arlbench"], [39, "module-arlbench.autorl"], [40, "module-arlbench.core"], [41, "module-arlbench.core.algorithms"], [42, "module-arlbench.core.algorithms.dqn"], [43, "module-arlbench.core.algorithms.ppo"], [44, "module-arlbench.core.algorithms.sac"], [45, "module-arlbench.core.environments"], [46, "module-arlbench.core.wrappers"], [47, "module-arlbench.utils"]], "Submodules": [[38, "submodules"], [39, "submodules"], [40, "submodules"], [41, "submodules"], [42, "submodules"], [43, "submodules"], [44, "submodules"], [45, "submodules"], [46, "submodules"], [47, "submodules"]], "Subpackages": [[38, "subpackages"], [40, "subpackages"], [41, "subpackages"]], "arlbench": [[2, "module-arlbench"], [55, "arlbench"]], "arlbench package": [[38, "arlbench-package"]], "arlbench.arlbench": [[3, "module-arlbench.arlbench"]], "arlbench.arlbench module": [[38, "module-arlbench.arlbench"]], "arlbench.autorl": [[4, "module-arlbench.autorl"]], "arlbench.autorl package": [[39, "arlbench-autorl-package"]], "arlbench.autorl.autorl_env": [[5, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.autorl_env module": [[39, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.checkpointing": [[6, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.checkpointing module": [[39, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.objectives": [[7, "module-arlbench.autorl.objectives"]], "arlbench.autorl.objectives module": [[39, "module-arlbench.autorl.objectives"]], "arlbench.autorl.state_features": [[8, "module-arlbench.autorl.state_features"]], "arlbench.autorl.state_features 
module": [[39, "module-arlbench.autorl.state_features"]], "arlbench.core": [[9, "module-arlbench.core"]], "arlbench.core package": [[40, "arlbench-core-package"]], "arlbench.core.algorithms": [[10, "module-arlbench.core.algorithms"]], "arlbench.core.algorithms package": [[41, "arlbench-core-algorithms-package"]], "arlbench.core.algorithms.algorithm": [[11, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.algorithm module": [[41, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.buffers": [[12, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.buffers module": [[41, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.common": [[13, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.common module": [[41, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.dqn": [[14, "module-arlbench.core.algorithms.dqn"]], "arlbench.core.algorithms.dqn package": [[42, "arlbench-core-algorithms-dqn-package"]], "arlbench.core.algorithms.dqn.dqn": [[15, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.dqn module": [[42, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.models": [[16, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.dqn.models module": [[42, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.ppo": [[17, "module-arlbench.core.algorithms.ppo"]], "arlbench.core.algorithms.ppo package": [[43, "arlbench-core-algorithms-ppo-package"]], "arlbench.core.algorithms.ppo.models": [[18, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.models module": [[43, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.ppo": [[19, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.ppo.ppo module": [[43, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.prioritised_item_buffer": 
[[20, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.prioritised_item_buffer module": [[41, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[21, "module-arlbench.core.algorithms.sac"]], "arlbench.core.algorithms.sac package": [[44, "arlbench-core-algorithms-sac-package"]], "arlbench.core.algorithms.sac.models": [[22, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.models module": [[44, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.sac": [[23, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.algorithms.sac.sac module": [[44, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.environments": [[24, "module-arlbench.core.environments"]], "arlbench.core.environments package": [[45, "arlbench-core-environments-package"]], "arlbench.core.environments.autorl_env": [[25, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.autorl_env module": [[45, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.brax_env": [[26, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.brax_env module": [[45, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.envpool_env": [[27, "module-arlbench.core.environments.envpool_env"]], "arlbench.core.environments.envpool_env module": [[45, "module-arlbench.core.environments.envpool_env"]], "arlbench.core.environments.gymnasium_env": [[28, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnasium_env module": [[45, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnax_env": [[29, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.gymnax_env module": [[45, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.make_env": [[30, "arlbench-core-environments-make-env"]], 
"arlbench.core.environments.make_env module": [[45, "module-arlbench.core.environments.make_env"]], "arlbench.core.environments.xland_env": [[31, "module-arlbench.core.environments.xland_env"]], "arlbench.core.environments.xland_env module": [[45, "module-arlbench.core.environments.xland_env"]], "arlbench.core.running_statistics": [[32, "module-arlbench.core.running_statistics"]], "arlbench.core.running_statistics module": [[40, "module-arlbench.core.running_statistics"]], "arlbench.core.wrappers": [[33, "module-arlbench.core.wrappers"]], "arlbench.core.wrappers package": [[46, "arlbench-core-wrappers-package"]], "arlbench.core.wrappers.flatten_observation": [[34, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.flatten_observation module": [[46, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.wrapper": [[35, "module-arlbench.core.wrappers.wrapper"]], "arlbench.core.wrappers.wrapper module": [[46, "module-arlbench.core.wrappers.wrapper"]], "arlbench.utils": [[36, "module-arlbench.utils"]], "arlbench.utils package": [[47, "arlbench-utils-package"]], "arlbench.utils.common": [[37, "module-arlbench.utils.common"]], "arlbench.utils.common module": [[47, "module-arlbench.utils.common"]]}, "docnames": ["advanced_usage/index", "api", "api/arlbench", "api/arlbench.arlbench", "api/arlbench.autorl", "api/arlbench.autorl.autorl_env", "api/arlbench.autorl.checkpointing", "api/arlbench.autorl.objectives", "api/arlbench.autorl.state_features", "api/arlbench.core", "api/arlbench.core.algorithms", "api/arlbench.core.algorithms.algorithm", "api/arlbench.core.algorithms.buffers", "api/arlbench.core.algorithms.common", "api/arlbench.core.algorithms.dqn", "api/arlbench.core.algorithms.dqn.dqn", "api/arlbench.core.algorithms.dqn.models", "api/arlbench.core.algorithms.ppo", "api/arlbench.core.algorithms.ppo.models", "api/arlbench.core.algorithms.ppo.ppo", "api/arlbench.core.algorithms.prioritised_item_buffer", 
"api/arlbench.core.algorithms.sac", "api/arlbench.core.algorithms.sac.models", "api/arlbench.core.algorithms.sac.sac", "api/arlbench.core.environments", "api/arlbench.core.environments.autorl_env", "api/arlbench.core.environments.brax_env", "api/arlbench.core.environments.envpool_env", "api/arlbench.core.environments.gymnasium_env", "api/arlbench.core.environments.gymnax_env", "api/arlbench.core.environments.make_env", "api/arlbench.core.environments.xland_env", "api/arlbench.core.running_statistics", "api/arlbench.core.wrappers", "api/arlbench.core.wrappers.flatten_observation", "api/arlbench.core.wrappers.wrapper", "api/arlbench.utils", "api/arlbench.utils.common", "arlbench", "arlbench.autorl", "arlbench.core", "arlbench.core.algorithms", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.sac", "arlbench.core.environments", "arlbench.core.wrappers", "arlbench.utils", "basic_usage/index", "commands", "contributing", "faq", "glossary", "index", "installation", "modules"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["advanced_usage/index.rst", "api.rst", "api/arlbench.rst", "api/arlbench.arlbench.rst", "api/arlbench.autorl.rst", "api/arlbench.autorl.autorl_env.rst", "api/arlbench.autorl.checkpointing.rst", "api/arlbench.autorl.objectives.rst", "api/arlbench.autorl.state_features.rst", "api/arlbench.core.rst", "api/arlbench.core.algorithms.rst", "api/arlbench.core.algorithms.algorithm.rst", "api/arlbench.core.algorithms.buffers.rst", "api/arlbench.core.algorithms.common.rst", "api/arlbench.core.algorithms.dqn.rst", "api/arlbench.core.algorithms.dqn.dqn.rst", "api/arlbench.core.algorithms.dqn.models.rst", 
"api/arlbench.core.algorithms.ppo.rst", "api/arlbench.core.algorithms.ppo.models.rst", "api/arlbench.core.algorithms.ppo.ppo.rst", "api/arlbench.core.algorithms.prioritised_item_buffer.rst", "api/arlbench.core.algorithms.sac.rst", "api/arlbench.core.algorithms.sac.models.rst", "api/arlbench.core.algorithms.sac.sac.rst", "api/arlbench.core.environments.rst", "api/arlbench.core.environments.autorl_env.rst", "api/arlbench.core.environments.brax_env.rst", "api/arlbench.core.environments.envpool_env.rst", "api/arlbench.core.environments.gymnasium_env.rst", "api/arlbench.core.environments.gymnax_env.rst", "api/arlbench.core.environments.make_env.rst", "api/arlbench.core.environments.xland_env.rst", "api/arlbench.core.running_statistics.rst", "api/arlbench.core.wrappers.rst", "api/arlbench.core.wrappers.flatten_observation.rst", "api/arlbench.core.wrappers.wrapper.rst", "api/arlbench.utils.rst", "api/arlbench.utils.common.rst", "arlbench.rst", "arlbench.autorl.rst", "arlbench.core.rst", "arlbench.core.algorithms.rst", "arlbench.core.algorithms.dqn.rst", "arlbench.core.algorithms.ppo.rst", "arlbench.core.algorithms.sac.rst", "arlbench.core.environments.rst", "arlbench.core.wrappers.rst", "arlbench.utils.rst", "basic_usage/index.rst", "commands.rst", "contributing.rst", "faq.rst", "glossary.rst", "index.rst", "installation.rst", "modules.rst"], "indexentries": {"__call__() (arlbench.autorl.objectives.emissions static method)": [[7, "arlbench.autorl.objectives.Emissions.__call__", false], [39, "arlbench.autorl.objectives.Emissions.__call__", false]], "__call__() (arlbench.autorl.objectives.objective static method)": [[7, "arlbench.autorl.objectives.Objective.__call__", false], [39, "arlbench.autorl.objectives.Objective.__call__", false]], "__call__() (arlbench.autorl.objectives.rewardmean static method)": [[7, "arlbench.autorl.objectives.RewardMean.__call__", false], [39, "arlbench.autorl.objectives.RewardMean.__call__", false]], "__call__() 
(arlbench.autorl.objectives.rewardstd static method)": [[7, "arlbench.autorl.objectives.RewardStd.__call__", false], [39, "arlbench.autorl.objectives.RewardStd.__call__", false]], "__call__() (arlbench.autorl.objectives.runtime static method)": [[7, "arlbench.autorl.objectives.Runtime.__call__", false], [39, "arlbench.autorl.objectives.Runtime.__call__", false]], "__call__() (arlbench.autorl.state_features.gradinfo static method)": [[8, "arlbench.autorl.state_features.GradInfo.__call__", false], [39, "arlbench.autorl.state_features.GradInfo.__call__", false]], "__call__() (arlbench.autorl.state_features.statefeature static method)": [[8, "arlbench.autorl.state_features.StateFeature.__call__", false], [39, "arlbench.autorl.state_features.StateFeature.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.cnnq method)": [[16, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false], [42, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.mlpq method)": [[16, "arlbench.core.algorithms.dqn.models.MLPQ.__call__", false], [42, "arlbench.core.algorithms.dqn.models.MLPQ.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false], [43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false], [43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.alphacoef method)": [[22, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false], [44, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false], [44, 
"arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacvectorcritic method)": [[22, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false], [44, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false]], "__lt__() (arlbench.autorl.objectives.objective method)": [[7, "arlbench.autorl.objectives.Objective.__lt__", false], [39, "arlbench.autorl.objectives.Objective.__lt__", false]], "__new__() (arlbench.autorl.objectives.objective static method)": [[7, "arlbench.autorl.objectives.Objective.__new__", false], [39, "arlbench.autorl.objectives.Objective.__new__", false]], "__new__() (arlbench.autorl.state_features.statefeature static method)": [[8, "arlbench.autorl.state_features.StateFeature.__new__", false], [39, "arlbench.autorl.state_features.StateFeature.__new__", false]], "action (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.action", false]], "action (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.action", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.action", false]], "action (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.action", 
false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.action", false]], "action (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.action", false], [44, "arlbench.core.algorithms.sac.sac.Transition.action", false]], "action_dim (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.action_dim", false]], "action_dim (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.action_dim", false]], "action_space (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false]], "action_space (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.action_space", false], [39, "arlbench.autorl.AutoRLEnv.action_space", false]], 
"action_space (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.action_space", false], [38, "arlbench.AutoRLEnv.action_space", false]], "action_space (arlbench.core.environments.brax_env.braxenv property)": [[26, "arlbench.core.environments.brax_env.BraxEnv.action_space", false], [45, "arlbench.core.environments.brax_env.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.braxenv property)": [[24, "arlbench.core.environments.BraxEnv.action_space", false], [45, "arlbench.core.environments.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[27, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false], [45, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.envpoolenv property)": [[24, "arlbench.core.environments.EnvpoolEnv.action_space", false], [45, "arlbench.core.environments.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[28, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false], [45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasiumenv property)": [[24, "arlbench.core.environments.GymnasiumEnv.action_space", false], [45, "arlbench.core.environments.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[29, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false], [45, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.gymnaxenv property)": [[24, "arlbench.core.environments.GymnaxEnv.action_space", false], [45, "arlbench.core.environments.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.xland_env.xlandenv property)": [[31, 
"arlbench.core.environments.xland_env.XLandEnv.action_space", false], [45, "arlbench.core.environments.xland_env.XLandEnv.action_space", false]], "action_space() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.action_space", false], [45, "arlbench.core.environments.autorl_env.Environment.action_space", false]], "action_space() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.action_space", false], [45, "arlbench.core.environments.Environment.action_space", false]], "action_type (arlbench.core.algorithms.algorithm property)": [[10, "arlbench.core.algorithms.Algorithm.action_type", false], [41, "arlbench.core.algorithms.Algorithm.action_type", false]], "action_type (arlbench.core.algorithms.algorithm.algorithm property)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false]], "activation (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.activation", false]], "activation (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.activation", false]], "activation (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.activation", false]], "activation (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, 
"arlbench.core.algorithms.sac.models.SACMLPActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.activation", false]], "actor_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false]], "actor_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false], [44, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false]], "actor_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false]], "actor_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false], [44, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false]], "actor_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false]], "actor_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false]], "advantages (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false]], "advantages (arlbench.core.algorithms.ppo.ppometrics attribute)": [[17, 
"arlbench.core.algorithms.ppo.PPOMetrics.advantages", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics.advantages", false]], "algorithm (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.Algorithm", false], [41, "arlbench.core.algorithms.Algorithm", false]], "algorithm (class in arlbench.core.algorithms.algorithm)": [[11, "arlbench.core.algorithms.algorithm.Algorithm", false], [41, "arlbench.core.algorithms.algorithm.Algorithm", false]], "algorithms (arlbench.autorl.autorl_env.autorlenv attribute)": [[39, "arlbench.autorl.autorl_env.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorl.autorlenv attribute)": [[39, "arlbench.autorl.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorlenv attribute)": [[38, "arlbench.AutoRLEnv.ALGORITHMS", false]], "alpha_init (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, "arlbench.core.algorithms.sac.models.AlphaCoef.alpha_init", false]], "alpha_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false]], "alpha_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false], [44, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false]], "alpha_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false]], "alpha_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false]], "alphacoef (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.AlphaCoef", false], [44, 
"arlbench.core.algorithms.sac.models.AlphaCoef", false]], "arlbench": [[2, "module-arlbench", false], [38, "module-arlbench", false]], "arlbench.arlbench": [[3, "module-arlbench.arlbench", false], [38, "module-arlbench.arlbench", false]], "arlbench.autorl": [[4, "module-arlbench.autorl", false], [39, "module-arlbench.autorl", false]], "arlbench.autorl.autorl_env": [[5, "module-arlbench.autorl.autorl_env", false], [39, "module-arlbench.autorl.autorl_env", false]], "arlbench.autorl.checkpointing": [[6, "module-arlbench.autorl.checkpointing", false], [39, "module-arlbench.autorl.checkpointing", false]], "arlbench.autorl.objectives": [[7, "module-arlbench.autorl.objectives", false], [39, "module-arlbench.autorl.objectives", false]], "arlbench.autorl.state_features": [[8, "module-arlbench.autorl.state_features", false], [39, "module-arlbench.autorl.state_features", false]], "arlbench.core": [[9, "module-arlbench.core", false], [40, "module-arlbench.core", false]], "arlbench.core.algorithms": [[10, "module-arlbench.core.algorithms", false], [41, "module-arlbench.core.algorithms", false]], "arlbench.core.algorithms.algorithm": [[11, "module-arlbench.core.algorithms.algorithm", false], [41, "module-arlbench.core.algorithms.algorithm", false]], "arlbench.core.algorithms.buffers": [[12, "module-arlbench.core.algorithms.buffers", false], [41, "module-arlbench.core.algorithms.buffers", false]], "arlbench.core.algorithms.common": [[13, "module-arlbench.core.algorithms.common", false], [41, "module-arlbench.core.algorithms.common", false]], "arlbench.core.algorithms.dqn": [[14, "module-arlbench.core.algorithms.dqn", false], [42, "module-arlbench.core.algorithms.dqn", false]], "arlbench.core.algorithms.dqn.dqn": [[15, "module-arlbench.core.algorithms.dqn.dqn", false], [42, "module-arlbench.core.algorithms.dqn.dqn", false]], "arlbench.core.algorithms.dqn.models": [[16, "module-arlbench.core.algorithms.dqn.models", false], [42, "module-arlbench.core.algorithms.dqn.models", false]], 
"arlbench.core.algorithms.ppo": [[17, "module-arlbench.core.algorithms.ppo", false], [43, "module-arlbench.core.algorithms.ppo", false]], "arlbench.core.algorithms.ppo.models": [[18, "module-arlbench.core.algorithms.ppo.models", false], [43, "module-arlbench.core.algorithms.ppo.models", false]], "arlbench.core.algorithms.ppo.ppo": [[19, "module-arlbench.core.algorithms.ppo.ppo", false], [43, "module-arlbench.core.algorithms.ppo.ppo", false]], "arlbench.core.algorithms.prioritised_item_buffer": [[20, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [41, "module-arlbench.core.algorithms.prioritised_item_buffer", false]], "arlbench.core.algorithms.sac": [[21, "module-arlbench.core.algorithms.sac", false], [44, "module-arlbench.core.algorithms.sac", false]], "arlbench.core.algorithms.sac.models": [[22, "module-arlbench.core.algorithms.sac.models", false], [44, "module-arlbench.core.algorithms.sac.models", false]], "arlbench.core.algorithms.sac.sac": [[23, "module-arlbench.core.algorithms.sac.sac", false], [44, "module-arlbench.core.algorithms.sac.sac", false]], "arlbench.core.environments": [[24, "module-arlbench.core.environments", false], [45, "module-arlbench.core.environments", false]], "arlbench.core.environments.autorl_env": [[25, "module-arlbench.core.environments.autorl_env", false], [45, "module-arlbench.core.environments.autorl_env", false]], "arlbench.core.environments.brax_env": [[26, "module-arlbench.core.environments.brax_env", false], [45, "module-arlbench.core.environments.brax_env", false]], "arlbench.core.environments.envpool_env": [[27, "module-arlbench.core.environments.envpool_env", false], [45, "module-arlbench.core.environments.envpool_env", false]], "arlbench.core.environments.gymnasium_env": [[28, "module-arlbench.core.environments.gymnasium_env", false], [45, "module-arlbench.core.environments.gymnasium_env", false]], "arlbench.core.environments.gymnax_env": [[29, "module-arlbench.core.environments.gymnax_env", false], [45, 
"module-arlbench.core.environments.gymnax_env", false]], "arlbench.core.environments.make_env": [[45, "module-arlbench.core.environments.make_env", false]], "arlbench.core.environments.xland_env": [[31, "module-arlbench.core.environments.xland_env", false], [45, "module-arlbench.core.environments.xland_env", false]], "arlbench.core.running_statistics": [[32, "module-arlbench.core.running_statistics", false], [40, "module-arlbench.core.running_statistics", false]], "arlbench.core.wrappers": [[33, "module-arlbench.core.wrappers", false], [46, "module-arlbench.core.wrappers", false]], "arlbench.core.wrappers.flatten_observation": [[34, "module-arlbench.core.wrappers.flatten_observation", false], [46, "module-arlbench.core.wrappers.flatten_observation", false]], "arlbench.core.wrappers.wrapper": [[35, "module-arlbench.core.wrappers.wrapper", false], [46, "module-arlbench.core.wrappers.wrapper", false]], "arlbench.utils": [[36, "module-arlbench.utils", false], [47, "module-arlbench.utils", false]], "arlbench.utils.common": [[37, "module-arlbench.utils.common", false], [47, "module-arlbench.utils.common", false]], "automl": [[52, "term-AutoML", true]], "autorl": [[52, "term-AutoRL", true]], "autorlenv (class in arlbench)": [[2, "arlbench.AutoRLEnv", false], [38, "arlbench.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl)": [[4, "arlbench.autorl.AutoRLEnv", false], [39, "arlbench.autorl.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl.autorl_env)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv", false]], "bo": [[52, "term-BO", true]], "braxenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.BraxEnv", false], [45, "arlbench.core.environments.BraxEnv", false]], "braxenv (class in arlbench.core.environments.brax_env)": [[26, "arlbench.core.environments.brax_env.BraxEnv", false], [45, "arlbench.core.environments.brax_env.BraxEnv", false]], "buffer_state 
(arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false], [42, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[17, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false], [43, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false], [44, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sacstate attribute)": [[21, "arlbench.core.algorithms.sac.SACState.buffer_state", false], [44, "arlbench.core.algorithms.sac.SACState.buffer_state", false]], "checkpointer (class in arlbench.autorl.checkpointing)": [[6, "arlbench.autorl.checkpointing.Checkpointer", false], [39, "arlbench.autorl.checkpointing.Checkpointer", false]], "checkpoints (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.checkpoints", false], [39, "arlbench.autorl.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.checkpoints", false], [38, "arlbench.AutoRLEnv.checkpoints", false]], "cnnactorcritic (class in arlbench.core.algorithms.ppo.models)": [[18, 
"arlbench.core.algorithms.ppo.models.CNNActorCritic", false], [43, "arlbench.core.algorithms.ppo.models.CNNActorCritic", false]], "cnnq (class in arlbench.core.algorithms.dqn.models)": [[16, "arlbench.core.algorithms.dqn.models.CNNQ", false], [42, "arlbench.core.algorithms.dqn.models.CNNQ", false]], "config (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.config", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.config", false]], "config (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.config", false], [39, "arlbench.autorl.AutoRLEnv.config", false]], "config (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.config", false], [38, "arlbench.AutoRLEnv.config", false]], "config_space (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false]], "config_space (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.config_space", false], [39, "arlbench.autorl.AutoRLEnv.config_space", false]], "config_space (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.config_space", false], [38, "arlbench.AutoRLEnv.config_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils)": [[36, "arlbench.utils.config_space_to_gymnasium_space", false], [47, "arlbench.utils.config_space_to_gymnasium_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.config_space_to_gymnasium_space", false], [47, "arlbench.utils.common.config_space_to_gymnasium_space", false]], "config_space_to_yaml() (in module arlbench.utils)": [[36, "arlbench.utils.config_space_to_yaml", false], [47, "arlbench.utils.config_space_to_yaml", false]], "config_space_to_yaml() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.config_space_to_yaml", false], [47, "arlbench.utils.common.config_space_to_yaml", false]], 
"count (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[40, "arlbench.core.running_statistics.RunningStatisticsState.count", false]], "create_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[20, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false], [41, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false]], "create_with_opt_state() (arlbench.core.algorithms.dqn.dqn.dqntrainstate class method)": [[42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.ppo.ppo.ppotrainstate class method)": [[43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.sac.sac.sactrainstate class method)": [[44, "arlbench.core.algorithms.sac.sac.SACTrainState.create_with_opt_state", false]], "critic (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.critic", false]], "critic_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false]], "critic_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false], [44, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false]], "critic_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false]], "critic_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false], [44, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false]], "critic_train_state 
(arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false]], "critic_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false]], "cur_rewards (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false]], "cur_rewards (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false]], "denormalize() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.denormalize", false], [40, "arlbench.core.running_statistics.denormalize", false]], "discrete (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.discrete", false]], "discrete (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.discrete", false]], "done (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.done", false]], "done (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.done", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.done", false]], "done 
(arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.done", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.done", false]], "done (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.done", false], [44, "arlbench.core.algorithms.sac.sac.Transition.done", false]], "dqn": [[52, "term-DQN", true]], "dqn (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.DQN", false], [41, "arlbench.core.algorithms.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQN", false], [42, "arlbench.core.algorithms.dqn.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false]], "dqnstate (class in arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNState", false], [42, "arlbench.core.algorithms.dqn.DQNState", false]], "dqnstate (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNState", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNState", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn)": [[14, 
"arlbench.core.algorithms.dqn.DQNTrainingResult", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false]], "dqntrainreturnt (in module arlbench.core.algorithms.dqn)": [[14, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false], [42, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false]], "dqntrainstate (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false]], "emissions (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.Emissions", false], [39, "arlbench.autorl.objectives.Emissions", false]], "env_name (arlbench.core.environments.autorl_env.environment property)": [[25, "arlbench.core.environments.autorl_env.Environment.env_name", false], [45, "arlbench.core.environments.autorl_env.Environment.env_name", false]], "env_name (arlbench.core.environments.environment property)": [[24, "arlbench.core.environments.Environment.env_name", false], [45, "arlbench.core.environments.Environment.env_name", false]], "env_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": 
[[17, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false]], "environment (class in arlbench.core.environments)": [[24, "arlbench.core.environments.Environment", false], [45, "arlbench.core.environments.Environment", false]], "environment (class in arlbench.core.environments.autorl_env)": [[25, "arlbench.core.environments.autorl_env.Environment", false], [45, "arlbench.core.environments.autorl_env.Environment", false]], "envpoolenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.EnvpoolEnv", false], [45, "arlbench.core.environments.EnvpoolEnv", false]], "envpoolenv (class in arlbench.core.environments.envpool_env)": [[27, "arlbench.core.environments.envpool_env.EnvpoolEnv", false], [45, "arlbench.core.environments.envpool_env.EnvpoolEnv", false]], "eval() (arlbench.autorl.autorl_env.autorlenv method)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false]], "eval() (arlbench.autorl.autorlenv method)": [[4, "arlbench.autorl.AutoRLEnv.eval", false], [39, "arlbench.autorl.AutoRLEnv.eval", false]], "eval() (arlbench.autorlenv method)": [[2, "arlbench.AutoRLEnv.eval", false], [38, "arlbench.AutoRLEnv.eval", false]], "eval() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.eval", false], [41, "arlbench.core.algorithms.Algorithm.eval", false]], "eval() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, 
"arlbench.core.algorithms.algorithm.Algorithm.eval", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.eval", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[14, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false]], "flattenobservationwrapper (class in arlbench.core.wrappers)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper", false]], "flattenobservationwrapper (class in arlbench.core.wrappers.flatten_observation)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false]], 
"from_tuple() (arlbench.core.algorithms.common.timestep method)": [[41, "arlbench.core.algorithms.common.TimeStep.from_tuple", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false], [42, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false], [43, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() 
(arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false], [41, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false], [41, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_default_hpo_config", false], [41, "arlbench.core.algorithms.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false], [42, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_default_hpo_config", false], [41, 
"arlbench.core.algorithms.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false], [43, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_default_hpo_config", false], [41, "arlbench.core.algorithms.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false], [44, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false], [41, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_default_nas_config", false], [41, "arlbench.core.algorithms.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn static method)": [[14, 
"arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false], [42, "arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_default_nas_config", false], [41, "arlbench.core.algorithms.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false], [43, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_default_nas_config", false], [41, "arlbench.core.algorithms.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false], [44, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false]], "get_hpo_config_space() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false], [41, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() 
(arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_hpo_config_space", false], [41, "arlbench.core.algorithms.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false], [42, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_hpo_config_space", false], [41, "arlbench.core.algorithms.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false], [43, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_hpo_config_space", false], [41, "arlbench.core.algorithms.SAC.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false], [44, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false]], "get_hpo_config_space() 
(arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false], [41, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_hpo_search_space", false], [41, "arlbench.core.algorithms.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false], [42, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_hpo_search_space", false], [41, "arlbench.core.algorithms.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false], [43, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false]], 
"get_hpo_search_space() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_hpo_search_space", false], [41, "arlbench.core.algorithms.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false], [44, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm static method)": [[10, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false], [41, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn static method)": [[10, "arlbench.core.algorithms.DQN.get_nas_config_space", false], [41, "arlbench.core.algorithms.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[14, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false], [42, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo static method)": [[10, "arlbench.core.algorithms.PPO.get_nas_config_space", false], [41, "arlbench.core.algorithms.PPO.get_nas_config_space", false]], 
"get_nas_config_space() (arlbench.core.algorithms.ppo.ppo static method)": [[17, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false], [43, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac static method)": [[10, "arlbench.core.algorithms.SAC.get_nas_config_space", false], [41, "arlbench.core.algorithms.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac static method)": [[21, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false], [44, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false], [44, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false]], "get_spec() (arlbench.autorl.objectives.emissions static method)": [[7, "arlbench.autorl.objectives.Emissions.get_spec", false], [39, "arlbench.autorl.objectives.Emissions.get_spec", false]], "get_spec() (arlbench.autorl.objectives.objective static method)": [[7, "arlbench.autorl.objectives.Objective.get_spec", false], [39, "arlbench.autorl.objectives.Objective.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardmean static method)": [[7, "arlbench.autorl.objectives.RewardMean.get_spec", false], [39, "arlbench.autorl.objectives.RewardMean.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardstd static method)": [[7, "arlbench.autorl.objectives.RewardStd.get_spec", false], [39, "arlbench.autorl.objectives.RewardStd.get_spec", false]], "get_spec() (arlbench.autorl.objectives.runtime static method)": [[7, "arlbench.autorl.objectives.Runtime.get_spec", false], [39, 
"arlbench.autorl.objectives.Runtime.get_spec", false]], "get_state_space() (arlbench.autorl.state_features.gradinfo static method)": [[8, "arlbench.autorl.state_features.GradInfo.get_state_space", false], [39, "arlbench.autorl.state_features.GradInfo.get_state_space", false]], "get_state_space() (arlbench.autorl.state_features.statefeature static method)": [[8, "arlbench.autorl.state_features.StateFeature.get_state_space", false], [39, "arlbench.autorl.state_features.StateFeature.get_state_space", false]], "global_step (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false]], "gradinfo (class in arlbench.autorl.state_features)": [[8, "arlbench.autorl.state_features.GradInfo", false], [39, 
"arlbench.autorl.state_features.GradInfo", false]], "grads (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppometrics attribute)": [[17, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils)": [[36, "arlbench.utils.gymnasium_space_to_gymnax_space", false], [47, "arlbench.utils.gymnasium_space_to_gymnax_space", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.gymnasium_space_to_gymnax_space", false], [47, "arlbench.utils.common.gymnasium_space_to_gymnax_space", false]], "gymnasiumenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.GymnasiumEnv", false], [45, "arlbench.core.environments.GymnasiumEnv", false]], "gymnasiumenv (class in arlbench.core.environments.gymnasium_env)": [[28, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false], [45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false]], "gymnaxenv (class in arlbench.core.environments)": [[24, "arlbench.core.environments.GymnaxEnv", false], [45, "arlbench.core.environments.GymnaxEnv", false]], "gymnaxenv (class in arlbench.core.environments.gymnax_env)": [[29, "arlbench.core.environments.gymnax_env.GymnaxEnv", false], [45, "arlbench.core.environments.gymnax_env.GymnaxEnv", false]], "hidden_size 
(arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.hidden_size", false]], "hpo": [[52, "term-HPO", true]], "hpo_config (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.hpo_config", false], [39, "arlbench.autorl.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.hpo_config", false], [38, "arlbench.AutoRLEnv.hpo_config", false]], "info (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, 
"arlbench.core.algorithms.dqn.dqn.Transition.info", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.info", false]], "info (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.info", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.info", false]], "info (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.info", false], [44, "arlbench.core.algorithms.sac.sac.Transition.info", false]], "init() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.init", false], [41, "arlbench.core.algorithms.Algorithm.init", false]], "init() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.init", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.init", false]], "init() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.init", false], [41, "arlbench.core.algorithms.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.init", false], [42, "arlbench.core.algorithms.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.init", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.ppo method)": [[10, "arlbench.core.algorithms.PPO.init", false], [41, "arlbench.core.algorithms.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo method)": [[17, "arlbench.core.algorithms.ppo.PPO.init", false], [43, "arlbench.core.algorithms.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.init", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.init", false], [41, "arlbench.core.algorithms.SAC.init", 
false]], "init() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.init", false], [44, "arlbench.core.algorithms.sac.SAC.init", false]], "init() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.init", false], [44, "arlbench.core.algorithms.sac.sac.SAC.init", false]], "init_state() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.init_state", false], [40, "arlbench.core.running_statistics.init_state", false]], "items() (arlbench.core.algorithms.common.timestep method)": [[13, "arlbench.core.algorithms.common.TimeStep.items", false], [41, "arlbench.core.algorithms.common.TimeStep.items", false]], "key (arlbench.autorl.objectives.emissions attribute)": [[39, "arlbench.autorl.objectives.Emissions.KEY", false]], "key (arlbench.autorl.objectives.objective attribute)": [[39, "arlbench.autorl.objectives.Objective.KEY", false]], "key (arlbench.autorl.objectives.rewardmean attribute)": [[39, "arlbench.autorl.objectives.RewardMean.KEY", false]], "key (arlbench.autorl.objectives.rewardstd attribute)": [[39, "arlbench.autorl.objectives.RewardStd.KEY", false]], "key (arlbench.autorl.objectives.runtime attribute)": [[39, "arlbench.autorl.objectives.Runtime.KEY", false]], "key (arlbench.autorl.state_features.gradinfo attribute)": [[39, "arlbench.autorl.state_features.GradInfo.KEY", false]], "key (arlbench.autorl.state_features.statefeature attribute)": [[39, "arlbench.autorl.state_features.StateFeature.KEY", false]], "keys() (arlbench.core.algorithms.common.timestep method)": [[13, "arlbench.core.algorithms.common.TimeStep.keys", false], [41, "arlbench.core.algorithms.common.TimeStep.keys", false]], "last_obs (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.last_obs", false]], "load() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.load", false], [39, 
"arlbench.autorl.checkpointing.Checkpointer.load", false]], "load_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false], [39, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false]], "log_prob (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false]], "log_std_max (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_max", false]], "log_std_max (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_max", false]], "log_std_min (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_min", false]], "log_std_min (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_min", false]], "loss (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppometrics attribute)": [[17, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false]], "make_env() (in module arlbench.core.environments)": [[24, "arlbench.core.environments.make_env", false], [30, 
"arlbench.core.environments.make_env", false], [45, "arlbench.core.environments.make_env", false]], "make_env() (in module arlbench.core.environments.make_env)": [[45, "arlbench.core.environments.make_env.make_env", false]], "make_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[20, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false], [41, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false]], "mean (arlbench.core.running_statistics.nestedmeanstd attribute)": [[40, "arlbench.core.running_statistics.NestedMeanStd.mean", false]], "metrics (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[14, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false]], "mlpactorcritic (class in 
arlbench.core.algorithms.ppo.models)": [[18, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false], [43, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false]], "mlpq (class in arlbench.core.algorithms.dqn.models)": [[16, "arlbench.core.algorithms.dqn.models.MLPQ", false], [42, "arlbench.core.algorithms.dqn.models.MLPQ", false]], "mode() (arlbench.core.algorithms.sac.models.tanhtransformeddistribution method)": [[22, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false], [44, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false]], "module": [[2, "module-arlbench", false], [3, "module-arlbench.arlbench", false], [4, "module-arlbench.autorl", false], [5, "module-arlbench.autorl.autorl_env", false], [6, "module-arlbench.autorl.checkpointing", false], [7, "module-arlbench.autorl.objectives", false], [8, "module-arlbench.autorl.state_features", false], [9, "module-arlbench.core", false], [10, "module-arlbench.core.algorithms", false], [11, "module-arlbench.core.algorithms.algorithm", false], [12, "module-arlbench.core.algorithms.buffers", false], [13, "module-arlbench.core.algorithms.common", false], [14, "module-arlbench.core.algorithms.dqn", false], [15, "module-arlbench.core.algorithms.dqn.dqn", false], [16, "module-arlbench.core.algorithms.dqn.models", false], [17, "module-arlbench.core.algorithms.ppo", false], [18, "module-arlbench.core.algorithms.ppo.models", false], [19, "module-arlbench.core.algorithms.ppo.ppo", false], [20, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [21, "module-arlbench.core.algorithms.sac", false], [22, "module-arlbench.core.algorithms.sac.models", false], [23, "module-arlbench.core.algorithms.sac.sac", false], [24, "module-arlbench.core.environments", false], [25, "module-arlbench.core.environments.autorl_env", false], [26, "module-arlbench.core.environments.brax_env", false], [27, "module-arlbench.core.environments.envpool_env", false], [28, 
"module-arlbench.core.environments.gymnasium_env", false], [29, "module-arlbench.core.environments.gymnax_env", false], [31, "module-arlbench.core.environments.xland_env", false], [32, "module-arlbench.core.running_statistics", false], [33, "module-arlbench.core.wrappers", false], [34, "module-arlbench.core.wrappers.flatten_observation", false], [35, "module-arlbench.core.wrappers.wrapper", false], [36, "module-arlbench.utils", false], [37, "module-arlbench.utils.common", false], [38, "module-arlbench", false], [38, "module-arlbench.arlbench", false], [39, "module-arlbench.autorl", false], [39, "module-arlbench.autorl.autorl_env", false], [39, "module-arlbench.autorl.checkpointing", false], [39, "module-arlbench.autorl.objectives", false], [39, "module-arlbench.autorl.state_features", false], [40, "module-arlbench.core", false], [40, "module-arlbench.core.running_statistics", false], [41, "module-arlbench.core.algorithms", false], [41, "module-arlbench.core.algorithms.algorithm", false], [41, "module-arlbench.core.algorithms.buffers", false], [41, "module-arlbench.core.algorithms.common", false], [41, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [42, "module-arlbench.core.algorithms.dqn", false], [42, "module-arlbench.core.algorithms.dqn.dqn", false], [42, "module-arlbench.core.algorithms.dqn.models", false], [43, "module-arlbench.core.algorithms.ppo", false], [43, "module-arlbench.core.algorithms.ppo.models", false], [43, "module-arlbench.core.algorithms.ppo.ppo", false], [44, "module-arlbench.core.algorithms.sac", false], [44, "module-arlbench.core.algorithms.sac.models", false], [44, "module-arlbench.core.algorithms.sac.sac", false], [45, "module-arlbench.core.environments", false], [45, "module-arlbench.core.environments.autorl_env", false], [45, "module-arlbench.core.environments.brax_env", false], [45, "module-arlbench.core.environments.envpool_env", false], [45, "module-arlbench.core.environments.gymnasium_env", false], [45, 
"module-arlbench.core.environments.gymnax_env", false], [45, "module-arlbench.core.environments.make_env", false], [45, "module-arlbench.core.environments.xland_env", false], [46, "module-arlbench.core.wrappers", false], [46, "module-arlbench.core.wrappers.flatten_observation", false], [46, "module-arlbench.core.wrappers.wrapper", false], [47, "module-arlbench.utils", false], [47, "module-arlbench.utils.common", false]], "mrp_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[39, "arlbench.autorl.checkpointing.Checkpointer.MRP_FILE", false]], "multi-fidelity optimization": [[52, "term-Multi-fidelity-optimization", true]], "n_critics (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.n_critics", false]], "n_envs (arlbench.core.environments.autorl_env.environment property)": [[25, "arlbench.core.environments.autorl_env.Environment.n_envs", false], [45, "arlbench.core.environments.autorl_env.Environment.n_envs", false]], "n_envs (arlbench.core.environments.environment property)": [[24, "arlbench.core.environments.Environment.n_envs", false], [45, "arlbench.core.environments.Environment.n_envs", false]], "name (arlbench.core.algorithms.algorithm attribute)": [[41, "arlbench.core.algorithms.Algorithm.name", false]], "name (arlbench.core.algorithms.algorithm.algorithm attribute)": [[41, "arlbench.core.algorithms.algorithm.Algorithm.name", false]], "name (arlbench.core.algorithms.dqn attribute)": [[41, "arlbench.core.algorithms.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn attribute)": [[42, "arlbench.core.algorithms.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn.dqn attribute)": [[42, "arlbench.core.algorithms.dqn.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.name", false]], "name (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, 
"arlbench.core.algorithms.dqn.models.MLPQ.name", false]], "name (arlbench.core.algorithms.ppo attribute)": [[41, "arlbench.core.algorithms.PPO.name", false]], "name (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.ppo attribute)": [[43, "arlbench.core.algorithms.ppo.PPO.name", false]], "name (arlbench.core.algorithms.ppo.ppo.ppo attribute)": [[43, "arlbench.core.algorithms.ppo.ppo.PPO.name", false]], "name (arlbench.core.algorithms.sac attribute)": [[41, "arlbench.core.algorithms.SAC.name", false]], "name (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, "arlbench.core.algorithms.sac.models.AlphaCoef.name", false]], "name (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.name", false]], "name (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.name", false]], "name (arlbench.core.algorithms.sac.sac attribute)": [[44, "arlbench.core.algorithms.sac.SAC.name", false]], "name (arlbench.core.algorithms.sac.sac.sac attribute)": [[44, "arlbench.core.algorithms.sac.sac.SAC.name", false]], "nestedmeanstd (class in arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.NestedMeanStd", false], [40, 
"arlbench.core.running_statistics.NestedMeanStd", false]], "network_state (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[44, "arlbench.core.algorithms.sac.sac.SACTrainState.network_state", false]], "nodes_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[39, "arlbench.autorl.checkpointing.Checkpointer.NODES_FILE", false]], "normalize() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.normalize", false], [40, "arlbench.core.running_statistics.normalize", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false]], "numpy_to_jax() (in module 
arlbench.core.environments.envpool_env)": [[27, "arlbench.core.environments.envpool_env.numpy_to_jax", false], [45, "arlbench.core.environments.envpool_env.numpy_to_jax", false]], "objective (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.Objective", false], [39, "arlbench.autorl.objectives.Objective", false]], "objectives (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false]], "objectives (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.objectives", false], [39, "arlbench.autorl.AutoRLEnv.objectives", false]], "objectives (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.objectives", false], [38, "arlbench.AutoRLEnv.objectives", false]], "obs (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false]], "obs (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false]], "obs (arlbench.core.algorithms.ppo.pporunnerstate attribute)": 
[[17, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.obs", false], [44, "arlbench.core.algorithms.sac.sac.Transition.obs", false]], "obs (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.obs", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.obs", false]], "observation_space (arlbench.autorl.autorl_env.autorlenv property)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorl.autorlenv property)": [[4, "arlbench.autorl.AutoRLEnv.observation_space", false], [39, "arlbench.autorl.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorlenv property)": [[2, "arlbench.AutoRLEnv.observation_space", false], [38, "arlbench.AutoRLEnv.observation_space", false]], "observation_space (arlbench.core.environments.brax_env.braxenv property)": [[26, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false], [45, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.braxenv property)": [[24, "arlbench.core.environments.BraxEnv.observation_space", false], [45, "arlbench.core.environments.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[27, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false], [45, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false]], "observation_space 
(arlbench.core.environments.envpoolenv property)": [[24, "arlbench.core.environments.EnvpoolEnv.observation_space", false], [45, "arlbench.core.environments.EnvpoolEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[28, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false], [45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasiumenv property)": [[24, "arlbench.core.environments.GymnasiumEnv.observation_space", false], [45, "arlbench.core.environments.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[29, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false], [45, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnaxenv property)": [[24, "arlbench.core.environments.GymnaxEnv.observation_space", false], [45, "arlbench.core.environments.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.xland_env.xlandenv property)": [[31, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false], [45, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false]], "observation_space (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper property)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false]], "observation_space (arlbench.core.wrappers.flattenobservationwrapper property)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false]], "observation_space() 
(arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.observation_space", false], [45, "arlbench.core.environments.autorl_env.Environment.observation_space", false]], "observation_space() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.observation_space", false], [45, "arlbench.core.environments.Environment.observation_space", false]], "opt_state (arlbench.core.algorithms.dqn.dqn.dqntrainstate attribute)": [[42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.opt_state", false]], "opt_state (arlbench.core.algorithms.ppo.ppo.ppotrainstate attribute)": [[43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.opt_state", false]], "parent (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.parent", false]], "parent (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.parent", false]], "parent (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.parent", false]], "parent (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, "arlbench.core.algorithms.sac.models.AlphaCoef.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, 
"arlbench.core.algorithms.sac.models.SACMLPCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.parent", false]], "ppo": [[52, "term-PPO", true]], "ppo (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.PPO", false], [41, "arlbench.core.algorithms.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPO", false], [43, "arlbench.core.algorithms.ppo.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO", false]], "ppometrics (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOMetrics", false], [43, "arlbench.core.algorithms.ppo.PPOMetrics", false]], "ppometrics (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false]], "ppostate (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOState", false], [43, "arlbench.core.algorithms.ppo.PPOState", false]], "ppostate (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOState", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOState", false]], "ppotrainingresult (class in arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult", false]], "ppotrainingresult (class in 
arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false]], "ppotrainreturnt (in module arlbench.core.algorithms.ppo)": [[17, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false], [43, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false]], "ppotrainstate (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false]], "predict() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.predict", false], [41, "arlbench.core.algorithms.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.predict", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.predict", false], [41, "arlbench.core.algorithms.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.predict", false], [42, "arlbench.core.algorithms.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.ppo method)": [[10, "arlbench.core.algorithms.PPO.predict", false], [41, "arlbench.core.algorithms.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo method)": [[17, "arlbench.core.algorithms.ppo.PPO.predict", false], [43, "arlbench.core.algorithms.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.sac 
method)": [[10, "arlbench.core.algorithms.SAC.predict", false], [41, "arlbench.core.algorithms.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.predict", false], [44, "arlbench.core.algorithms.sac.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.predict", false], [44, "arlbench.core.algorithms.sac.sac.SAC.predict", false]], "random search": [[52, "term-Random-Search", true]], "rank (arlbench.autorl.objectives.emissions attribute)": [[39, "arlbench.autorl.objectives.Emissions.RANK", false]], "rank (arlbench.autorl.objectives.objective attribute)": [[39, "arlbench.autorl.objectives.Objective.RANK", false]], "rank (arlbench.autorl.objectives.rewardmean attribute)": [[39, "arlbench.autorl.objectives.RewardMean.RANK", false]], "rank (arlbench.autorl.objectives.rewardstd attribute)": [[39, "arlbench.autorl.objectives.RewardStd.RANK", false]], "rank (arlbench.autorl.objectives.runtime attribute)": [[39, "arlbench.autorl.objectives.Runtime.RANK", false]], "recursive_concat() (in module arlbench.utils)": [[36, "arlbench.utils.recursive_concat", false], [47, "arlbench.utils.recursive_concat", false]], "recursive_concat() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.recursive_concat", false], [47, "arlbench.utils.common.recursive_concat", false]], "replace() (arlbench.core.algorithms.common.timestep method)": [[41, "arlbench.core.algorithms.common.TimeStep.replace", false]], "replace() (arlbench.core.algorithms.dqn.dqn.dqntrainstate method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false]], "replace() (arlbench.core.algorithms.ppo.ppo.ppotrainstate method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false]], "replace() 
(arlbench.core.algorithms.sac.sac.sactrainstate method)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false]], "replace() (arlbench.core.running_statistics.nestedmeanstd method)": [[32, "arlbench.core.running_statistics.NestedMeanStd.replace", false], [40, "arlbench.core.running_statistics.NestedMeanStd.replace", false]], "replace() (arlbench.core.running_statistics.runningstatisticsstate method)": [[32, "arlbench.core.running_statistics.RunningStatisticsState.replace", false], [40, "arlbench.core.running_statistics.RunningStatisticsState.replace", false]], "reset() (arlbench.autorl.autorl_env.autorlenv method)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false]], "reset() (arlbench.autorl.autorlenv method)": [[4, "arlbench.autorl.AutoRLEnv.reset", false], [39, "arlbench.autorl.AutoRLEnv.reset", false]], "reset() (arlbench.autorlenv method)": [[2, "arlbench.AutoRLEnv.reset", false], [38, "arlbench.AutoRLEnv.reset", false]], "reset() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.reset", false], [45, "arlbench.core.environments.autorl_env.Environment.reset", false]], "reset() (arlbench.core.environments.brax_env.braxenv method)": [[45, "arlbench.core.environments.brax_env.BraxEnv.reset", false]], "reset() (arlbench.core.environments.braxenv method)": [[45, "arlbench.core.environments.BraxEnv.reset", false]], "reset() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.reset", false], [45, "arlbench.core.environments.Environment.reset", false]], "reset() (arlbench.core.environments.envpool_env.envpoolenv method)": [[45, "arlbench.core.environments.envpool_env.EnvpoolEnv.reset", false]], "reset() (arlbench.core.environments.envpoolenv method)": [[45, "arlbench.core.environments.EnvpoolEnv.reset", 
false]], "reset() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnasiumenv method)": [[45, "arlbench.core.environments.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[45, "arlbench.core.environments.gymnax_env.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.gymnaxenv method)": [[45, "arlbench.core.environments.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.xland_env.xlandenv method)": [[45, "arlbench.core.environments.xland_env.XLandEnv.reset", false]], "reset() (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false]], "reset() (arlbench.core.wrappers.flattenobservationwrapper method)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper.reset", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper.reset", false]], "return_buffer (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false]], "return_buffer (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, 
"arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false]], "reward (arlbench.core.algorithms.common.timestep attribute)": [[41, "arlbench.core.algorithms.common.TimeStep.reward", false]], "reward (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false]], "reward (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false]], "reward (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.reward", false], [44, "arlbench.core.algorithms.sac.sac.Transition.reward", false]], "rewardmean (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.RewardMean", false], [39, "arlbench.autorl.objectives.RewardMean", false]], "rewardstd (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.RewardStd", false], [39, "arlbench.autorl.objectives.RewardStd", false]], "rng (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, "arlbench.core.algorithms.ppo.PPORunnerState.rng", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.rng", 
false]], "rng (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false]], "rng (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[21, "arlbench.core.algorithms.sac.SACRunnerState.rng", false], [44, "arlbench.core.algorithms.sac.SACRunnerState.rng", false]], "run_arlbench() (in module arlbench)": [[2, "arlbench.run_arlbench", false], [38, "arlbench.run_arlbench", false]], "run_arlbench() (in module arlbench.arlbench)": [[3, "arlbench.arlbench.run_arlbench", false], [38, "arlbench.arlbench.run_arlbench", false]], "runner_state (arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false]], "runner_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNState.runner_state", false], [42, "arlbench.core.algorithms.dqn.DQNState.runner_state", false]], "runner_state (arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[17, "arlbench.core.algorithms.ppo.PPOState.runner_state", false], [43, "arlbench.core.algorithms.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false], [44, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sacstate attribute)": [[21, "arlbench.core.algorithms.sac.SACState.runner_state", false], [44, "arlbench.core.algorithms.sac.SACState.runner_state", false]], "runningstatisticsstate (class in arlbench.core.running_statistics)": [[32, 
"arlbench.core.running_statistics.RunningStatisticsState", false], [40, "arlbench.core.running_statistics.RunningStatisticsState", false]], "runtime (class in arlbench.autorl.objectives)": [[7, "arlbench.autorl.objectives.Runtime", false], [39, "arlbench.autorl.objectives.Runtime", false]], "sac": [[52, "term-SAC", true]], "sac (class in arlbench.core.algorithms)": [[10, "arlbench.core.algorithms.SAC", false], [41, "arlbench.core.algorithms.SAC", false]], "sac (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SAC", false], [44, "arlbench.core.algorithms.sac.SAC", false]], "sac (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SAC", false], [44, "arlbench.core.algorithms.sac.sac.SAC", false]], "saccnnactor (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACCNNActor", false], [44, "arlbench.core.algorithms.sac.models.SACCNNActor", false]], "saccnncritic (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACCNNCritic", false], [44, "arlbench.core.algorithms.sac.models.SACCNNCritic", false]], "sacmetrics (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACMetrics", false], [44, "arlbench.core.algorithms.sac.SACMetrics", false]], "sacmetrics (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics", false]], "sacmlpactor (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACMLPActor", false], [44, "arlbench.core.algorithms.sac.models.SACMLPActor", false]], "sacmlpcritic (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACMLPCritic", false], [44, "arlbench.core.algorithms.sac.models.SACMLPCritic", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACRunnerState", 
false], [44, "arlbench.core.algorithms.sac.SACRunnerState", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACRunnerState", false], [44, "arlbench.core.algorithms.sac.sac.SACRunnerState", false]], "sacstate (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACState", false], [44, "arlbench.core.algorithms.sac.SACState", false]], "sacstate (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACState", false], [44, "arlbench.core.algorithms.sac.sac.SACState", false]], "sactrainingresult (class in arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult", false]], "sactrainingresult (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false]], "sactrainreturnt (in module arlbench.core.algorithms.sac)": [[21, "arlbench.core.algorithms.sac.SACTrainReturnT", false], [44, "arlbench.core.algorithms.sac.SACTrainReturnT", false]], "sactrainstate (class in arlbench.core.algorithms.sac.sac)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainState", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainState", false]], "sacvectorcritic (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.SACVectorCritic", false], [44, "arlbench.core.algorithms.sac.models.SACVectorCritic", false]], "sample_action() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[45, "arlbench.core.environments.gymnax_env.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.gymnaxenv method)": [[45, "arlbench.core.environments.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.xland_env.xlandenv method)": [[45, "arlbench.core.environments.xland_env.XLandEnv.sample_action", 
false]], "sample_actions() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.sample_actions", false], [45, "arlbench.core.environments.autorl_env.Environment.sample_actions", false]], "sample_actions() (arlbench.core.environments.environment method)": [[24, "arlbench.core.environments.Environment.sample_actions", false], [45, "arlbench.core.environments.Environment.sample_actions", false]], "save() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.save", false], [39, "arlbench.autorl.checkpointing.Checkpointer.save", false]], "save_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[6, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false], [39, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false]], "save_defaults_to_yaml() (in module arlbench.utils)": [[36, "arlbench.utils.save_defaults_to_yaml", false], [47, "arlbench.utils.save_defaults_to_yaml", false]], "save_defaults_to_yaml() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.save_defaults_to_yaml", false], [47, "arlbench.utils.common.save_defaults_to_yaml", false]], "scalars_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[39, "arlbench.autorl.checkpointing.Checkpointer.SCALARS_FILE", false]], "scope (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[42, "arlbench.core.algorithms.dqn.models.CNNQ.scope", false]], "scope (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[42, "arlbench.core.algorithms.dqn.models.MLPQ.scope", false]], "scope (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.scope", false]], "scope (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[44, 
"arlbench.core.algorithms.sac.models.AlphaCoef.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACCNNCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACMLPCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[44, "arlbench.core.algorithms.sac.models.SACVectorCritic.scope", false]], "setup() (arlbench.core.algorithms.dqn.models.cnnq method)": [[16, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false], [42, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false]], "setup() (arlbench.core.algorithms.dqn.models.mlpq method)": [[16, "arlbench.core.algorithms.dqn.models.MLPQ.setup", false], [42, "arlbench.core.algorithms.dqn.models.MLPQ.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false], [43, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[18, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false], [43, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.alphacoef method)": [[22, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false], [44, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNActor.setup", false], [44, 
"arlbench.core.algorithms.sac.models.SACCNNActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[22, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false], [44, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false], [44, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[22, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false], [44, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false]], "statefeature (class in arlbench.autorl.state_features)": [[8, "arlbench.autorl.state_features.StateFeature", false], [39, "arlbench.autorl.state_features.StateFeature", false]], "std (arlbench.core.running_statistics.nestedmeanstd attribute)": [[40, "arlbench.core.running_statistics.NestedMeanStd.std", false]], "step() (arlbench.autorl.autorl_env.autorlenv method)": [[5, "arlbench.autorl.autorl_env.AutoRLEnv.step", false], [39, "arlbench.autorl.autorl_env.AutoRLEnv.step", false]], "step() (arlbench.autorl.autorlenv method)": [[4, "arlbench.autorl.AutoRLEnv.step", false], [39, "arlbench.autorl.AutoRLEnv.step", false]], "step() (arlbench.autorlenv method)": [[2, "arlbench.AutoRLEnv.step", false], [38, "arlbench.AutoRLEnv.step", false]], "step() (arlbench.core.environments.autorl_env.environment method)": [[25, "arlbench.core.environments.autorl_env.Environment.step", false], [45, "arlbench.core.environments.autorl_env.Environment.step", false]], "step() (arlbench.core.environments.brax_env.braxenv method)": [[45, "arlbench.core.environments.brax_env.BraxEnv.step", false]], "step() (arlbench.core.environments.braxenv method)": [[45, "arlbench.core.environments.BraxEnv.step", false]], "step() (arlbench.core.environments.environment method)": [[24, 
"arlbench.core.environments.Environment.step", false], [45, "arlbench.core.environments.Environment.step", false]], "step() (arlbench.core.environments.envpool_env.envpoolenv method)": [[45, "arlbench.core.environments.envpool_env.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.envpoolenv method)": [[45, "arlbench.core.environments.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[45, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnasiumenv method)": [[45, "arlbench.core.environments.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[45, "arlbench.core.environments.gymnax_env.GymnaxEnv.step", false]], "step() (arlbench.core.environments.gymnaxenv method)": [[45, "arlbench.core.environments.GymnaxEnv.step", false]], "step() (arlbench.core.environments.xland_env.xlandenv method)": [[45, "arlbench.core.environments.xland_env.XLandEnv.step", false]], "step() (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[34, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false], [46, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false]], "step() (arlbench.core.wrappers.flattenobservationwrapper method)": [[33, "arlbench.core.wrappers.FlattenObservationWrapper.step", false], [46, "arlbench.core.wrappers.FlattenObservationWrapper.step", false]], "summed_variance (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[40, "arlbench.core.running_statistics.RunningStatisticsState.summed_variance", false]], "tanhtransformeddistribution (class in arlbench.core.algorithms.sac.models)": [[22, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false], [44, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false]], "target_params (arlbench.core.algorithms.dqn.dqn.dqntrainstate 
attribute)": [[42, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.target_params", false]], "target_params (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[44, "arlbench.core.algorithms.sac.sac.SACTrainState.target_params", false]], "td_error (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[14, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false], [42, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false], [44, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sacmetrics attribute)": [[21, "arlbench.core.algorithms.sac.SACMetrics.td_error", false], [44, "arlbench.core.algorithms.sac.SACMetrics.td_error", false]], "timestep (class in arlbench.core.algorithms.common)": [[13, "arlbench.core.algorithms.common.TimeStep", false], [41, "arlbench.core.algorithms.common.TimeStep", false]], "to_tuple() (arlbench.core.algorithms.common.timestep method)": [[41, "arlbench.core.algorithms.common.TimeStep.to_tuple", false]], "train() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.train", false], [41, "arlbench.core.algorithms.Algorithm.train", false]], "train() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.train", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.train", false]], "train() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.train", false], [41, "arlbench.core.algorithms.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.train", false], [42, 
"arlbench.core.algorithms.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.train", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.ppo method)": [[10, "arlbench.core.algorithms.PPO.train", false], [41, "arlbench.core.algorithms.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo method)": [[17, "arlbench.core.algorithms.ppo.PPO.train", false], [43, "arlbench.core.algorithms.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[19, "arlbench.core.algorithms.ppo.ppo.PPO.train", false], [43, "arlbench.core.algorithms.ppo.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.train", false], [41, "arlbench.core.algorithms.SAC.train", false]], "train() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.train", false], [44, "arlbench.core.algorithms.sac.SAC.train", false]], "train() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.train", false], [44, "arlbench.core.algorithms.sac.sac.SAC.train", false]], "train_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[14, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false], [42, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false], [43, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[17, 
"arlbench.core.algorithms.ppo.PPORunnerState.train_state", false], [43, "arlbench.core.algorithms.ppo.PPORunnerState.train_state", false]], "trajectories (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[15, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false], [42, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[14, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false], [42, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false], [43, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[17, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", false], [43, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[23, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false], [44, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[21, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false], [44, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false]], "transition (class in arlbench.core.algorithms.dqn.dqn)": [[15, "arlbench.core.algorithms.dqn.dqn.Transition", false], [42, "arlbench.core.algorithms.dqn.dqn.Transition", false]], "transition (class in arlbench.core.algorithms.ppo.ppo)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition", false]], "transition (class in arlbench.core.algorithms.sac.sac)": [[23, 
"arlbench.core.algorithms.sac.sac.Transition", false], [44, "arlbench.core.algorithms.sac.sac.Transition", false]], "tuple_concat() (in module arlbench.utils)": [[36, "arlbench.utils.tuple_concat", false], [47, "arlbench.utils.tuple_concat", false]], "tuple_concat() (in module arlbench.utils.common)": [[37, "arlbench.utils.common.tuple_concat", false], [47, "arlbench.utils.common.tuple_concat", false]], "uniform_sample() (in module arlbench.core.algorithms.buffers)": [[12, "arlbench.core.algorithms.buffers.uniform_sample", false], [41, "arlbench.core.algorithms.buffers.uniform_sample", false]], "update() (arlbench.core.algorithms.dqn method)": [[10, "arlbench.core.algorithms.DQN.update", false], [41, "arlbench.core.algorithms.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn method)": [[14, "arlbench.core.algorithms.dqn.DQN.update", false], [42, "arlbench.core.algorithms.dqn.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[15, "arlbench.core.algorithms.dqn.dqn.DQN.update", false], [42, "arlbench.core.algorithms.dqn.dqn.DQN.update", false]], "update() (in module arlbench.core.running_statistics)": [[32, "arlbench.core.running_statistics.update", false], [40, "arlbench.core.running_statistics.update", false]], "update_actor() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.update_actor", false], [41, "arlbench.core.algorithms.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.update_actor", false], [44, "arlbench.core.algorithms.sac.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false], [44, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false]], "update_alpha() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.update_alpha", false], [41, "arlbench.core.algorithms.SAC.update_alpha", 
false]], "update_alpha() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.update_alpha", false], [44, "arlbench.core.algorithms.sac.SAC.update_alpha", false]], "update_alpha() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false], [44, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false]], "update_critic() (arlbench.core.algorithms.sac method)": [[10, "arlbench.core.algorithms.SAC.update_critic", false], [41, "arlbench.core.algorithms.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac method)": [[21, "arlbench.core.algorithms.sac.SAC.update_critic", false], [44, "arlbench.core.algorithms.sac.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac.sac method)": [[23, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false], [44, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm method)": [[10, "arlbench.core.algorithms.Algorithm.update_hpo_config", false], [41, "arlbench.core.algorithms.Algorithm.update_hpo_config", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm.algorithm method)": [[11, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false], [41, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false]], "value (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[19, "arlbench.core.algorithms.ppo.ppo.Transition.value", false], [43, "arlbench.core.algorithms.ppo.ppo.Transition.value", false]], "value (arlbench.core.algorithms.sac.sac.transition attribute)": [[23, "arlbench.core.algorithms.sac.sac.Transition.value", false], [44, "arlbench.core.algorithms.sac.sac.Transition.value", false]], "values() (arlbench.core.algorithms.common.timestep method)": [[13, "arlbench.core.algorithms.common.TimeStep.values", false], [41, "arlbench.core.algorithms.common.TimeStep.values", false]], 
"wrapper (class in arlbench.core.wrappers)": [[33, "arlbench.core.wrappers.Wrapper", false], [46, "arlbench.core.wrappers.Wrapper", false]], "wrapper (class in arlbench.core.wrappers.wrapper)": [[35, "arlbench.core.wrappers.wrapper.Wrapper", false], [46, "arlbench.core.wrappers.wrapper.Wrapper", false]], "xlandenv (class in arlbench.core.environments.xland_env)": [[31, "arlbench.core.environments.xland_env.XLandEnv", false], [45, "arlbench.core.environments.xland_env.XLandEnv", false]]}, "objects": {"": [[38, 0, 0, "-", "arlbench"]], "arlbench": [[38, 1, 1, "", "AutoRLEnv"], [38, 0, 0, "-", "arlbench"], [39, 0, 0, "-", "autorl"], [40, 0, 0, "-", "core"], [38, 5, 1, "", "run_arlbench"], [47, 0, 0, "-", "utils"]], "arlbench.AutoRLEnv": [[38, 2, 1, "", "ALGORITHMS"], [38, 3, 1, "", "action_space"], [38, 3, 1, "", "checkpoints"], [38, 3, 1, "", "config"], [38, 3, 1, "", "config_space"], [38, 4, 1, "", "eval"], [38, 3, 1, "", "hpo_config"], [38, 3, 1, "", "objectives"], [38, 3, 1, "", "observation_space"], [38, 4, 1, "", "reset"], [38, 4, 1, "", "step"]], "arlbench.arlbench": [[38, 5, 1, "", "run_arlbench"]], "arlbench.autorl": [[39, 1, 1, "", "AutoRLEnv"], [39, 0, 0, "-", "autorl_env"], [39, 0, 0, "-", "checkpointing"], [39, 0, 0, "-", "objectives"], [39, 0, 0, "-", "state_features"]], "arlbench.autorl.AutoRLEnv": [[39, 2, 1, "", "ALGORITHMS"], [39, 3, 1, "", "action_space"], [39, 3, 1, "", "checkpoints"], [39, 3, 1, "", "config"], [39, 3, 1, "", "config_space"], [39, 4, 1, "", "eval"], [39, 3, 1, "", "hpo_config"], [39, 3, 1, "", "objectives"], [39, 3, 1, "", "observation_space"], [39, 4, 1, "", "reset"], [39, 4, 1, "", "step"]], "arlbench.autorl.autorl_env": [[39, 1, 1, "", "AutoRLEnv"]], "arlbench.autorl.autorl_env.AutoRLEnv": [[39, 2, 1, "", "ALGORITHMS"], [39, 3, 1, "", "action_space"], [39, 3, 1, "", "checkpoints"], [39, 3, 1, "", "config"], [39, 3, 1, "", "config_space"], [39, 4, 1, "", "eval"], [39, 3, 1, "", "hpo_config"], [39, 3, 1, "", "objectives"], [39, 3, 
1, "", "observation_space"], [39, 4, 1, "", "reset"], [39, 4, 1, "", "step"]], "arlbench.autorl.checkpointing": [[39, 1, 1, "", "Checkpointer"]], "arlbench.autorl.checkpointing.Checkpointer": [[39, 2, 1, "", "MRP_FILE"], [39, 2, 1, "", "NODES_FILE"], [39, 2, 1, "", "SCALARS_FILE"], [39, 4, 1, "", "load"], [39, 4, 1, "", "load_buffer"], [39, 4, 1, "", "save"], [39, 4, 1, "", "save_buffer"]], "arlbench.autorl.objectives": [[39, 1, 1, "", "Emissions"], [39, 1, 1, "", "Objective"], [39, 1, 1, "", "RewardMean"], [39, 1, 1, "", "RewardStd"], [39, 1, 1, "", "Runtime"]], "arlbench.autorl.objectives.Emissions": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Objective": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "__lt__"], [39, 4, 1, "", "__new__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardMean": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardStd": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Runtime": [[39, 2, 1, "", "KEY"], [39, 2, 1, "", "RANK"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_spec"]], "arlbench.autorl.state_features": [[39, 1, 1, "", "GradInfo"], [39, 1, 1, "", "StateFeature"]], "arlbench.autorl.state_features.GradInfo": [[39, 2, 1, "", "KEY"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "get_state_space"]], "arlbench.autorl.state_features.StateFeature": [[39, 2, 1, "", "KEY"], [39, 4, 1, "", "__call__"], [39, 4, 1, "", "__new__"], [39, 4, 1, "", "get_state_space"]], "arlbench.core": [[41, 0, 0, "-", "algorithms"], [45, 0, 0, "-", "environments"], [40, 0, 0, "-", "running_statistics"], [46, 0, 0, "-", "wrappers"]], "arlbench.core.algorithms": [[41, 1, 1, "", "Algorithm"], [41, 1, 1, "", "DQN"], [41, 1, 1, "", "PPO"], [41, 1, 
1, "", "SAC"], [41, 0, 0, "-", "algorithm"], [41, 0, 0, "-", "buffers"], [41, 0, 0, "-", "common"], [42, 0, 0, "-", "dqn"], [43, 0, 0, "-", "ppo"], [41, 0, 0, "-", "prioritised_item_buffer"], [44, 0, 0, "-", "sac"]], "arlbench.core.algorithms.Algorithm": [[41, 3, 1, "", "action_type"], [41, 4, 1, "", "eval"], [41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.DQN": [[41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update"]], "arlbench.core.algorithms.PPO": [[41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"]], "arlbench.core.algorithms.SAC": [[41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update_actor"], [41, 4, 1, "", "update_alpha"], [41, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.algorithm": 
[[41, 1, 1, "", "Algorithm"]], "arlbench.core.algorithms.algorithm.Algorithm": [[41, 3, 1, "", "action_type"], [41, 4, 1, "", "eval"], [41, 4, 1, "", "get_checkpoint_factory"], [41, 4, 1, "", "get_default_hpo_config"], [41, 4, 1, "", "get_default_nas_config"], [41, 4, 1, "", "get_hpo_config_space"], [41, 4, 1, "", "get_hpo_search_space"], [41, 4, 1, "", "get_nas_config_space"], [41, 4, 1, "", "init"], [41, 2, 1, "", "name"], [41, 4, 1, "", "predict"], [41, 4, 1, "", "train"], [41, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.buffers": [[41, 5, 1, "", "uniform_sample"]], "arlbench.core.algorithms.common": [[41, 1, 1, "", "TimeStep"]], "arlbench.core.algorithms.common.TimeStep": [[41, 2, 1, "", "action"], [41, 2, 1, "", "done"], [41, 4, 1, "", "from_tuple"], [41, 4, 1, "", "items"], [41, 4, 1, "", "keys"], [41, 2, 1, "", "last_obs"], [41, 2, 1, "", "obs"], [41, 4, 1, "", "replace"], [41, 2, 1, "", "reward"], [41, 4, 1, "", "to_tuple"], [41, 4, 1, "", "values"]], "arlbench.core.algorithms.dqn": [[42, 1, 1, "", "DQN"], [42, 1, 1, "", "DQNMetrics"], [42, 1, 1, "", "DQNRunnerState"], [42, 1, 1, "", "DQNState"], [42, 2, 1, "", "DQNTrainReturnT"], [42, 1, 1, "", "DQNTrainingResult"], [42, 0, 0, "-", "dqn"], [42, 0, 0, "-", "models"]], "arlbench.core.algorithms.dqn.DQN": [[42, 4, 1, "", "get_checkpoint_factory"], [42, 4, 1, "", "get_default_hpo_config"], [42, 4, 1, "", "get_default_nas_config"], [42, 4, 1, "", "get_hpo_config_space"], [42, 4, 1, "", "get_hpo_search_space"], [42, 4, 1, "", "get_nas_config_space"], [42, 4, 1, "", "init"], [42, 2, 1, "", "name"], [42, 4, 1, "", "predict"], [42, 4, 1, "", "train"], [42, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.DQNMetrics": [[42, 2, 1, "", "grads"], [42, 2, 1, "", "loss"], [42, 2, 1, "", "td_error"]], "arlbench.core.algorithms.dqn.DQNRunnerState": [[42, 2, 1, "", "env_state"], [42, 2, 1, "", "global_step"], [42, 2, 1, "", "normalizer_state"], [42, 2, 1, "", "obs"], [42, 2, 1, "", "rng"], [42, 2, 1, "", 
"train_state"]], "arlbench.core.algorithms.dqn.DQNState": [[42, 2, 1, "", "buffer_state"], [42, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.DQNTrainingResult": [[42, 2, 1, "", "eval_rewards"], [42, 2, 1, "", "metrics"], [42, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn": [[42, 1, 1, "", "DQN"], [42, 1, 1, "", "DQNMetrics"], [42, 1, 1, "", "DQNRunnerState"], [42, 1, 1, "", "DQNState"], [42, 1, 1, "", "DQNTrainState"], [42, 1, 1, "", "DQNTrainingResult"], [42, 1, 1, "", "Transition"]], "arlbench.core.algorithms.dqn.dqn.DQN": [[42, 4, 1, "", "get_checkpoint_factory"], [42, 4, 1, "", "get_default_hpo_config"], [42, 4, 1, "", "get_default_nas_config"], [42, 4, 1, "", "get_hpo_config_space"], [42, 4, 1, "", "get_hpo_search_space"], [42, 4, 1, "", "get_nas_config_space"], [42, 4, 1, "", "init"], [42, 2, 1, "", "name"], [42, 4, 1, "", "predict"], [42, 4, 1, "", "train"], [42, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.dqn.DQNMetrics": [[42, 2, 1, "", "grads"], [42, 2, 1, "", "loss"], [42, 2, 1, "", "td_error"]], "arlbench.core.algorithms.dqn.dqn.DQNRunnerState": [[42, 2, 1, "", "env_state"], [42, 2, 1, "", "global_step"], [42, 2, 1, "", "normalizer_state"], [42, 2, 1, "", "obs"], [42, 2, 1, "", "rng"], [42, 2, 1, "", "train_state"]], "arlbench.core.algorithms.dqn.dqn.DQNState": [[42, 2, 1, "", "buffer_state"], [42, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainState": [[42, 4, 1, "", "create_with_opt_state"], [42, 2, 1, "", "opt_state"], [42, 4, 1, "", "replace"], [42, 2, 1, "", "target_params"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult": [[42, 2, 1, "", "eval_rewards"], [42, 2, 1, "", "metrics"], [42, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn.Transition": [[42, 2, 1, "", "action"], [42, 2, 1, "", "done"], [42, 2, 1, "", "info"], [42, 2, 1, "", "obs"], [42, 2, 1, "", "reward"]], "arlbench.core.algorithms.dqn.models": [[42, 1, 1, "", "CNNQ"], [42, 1, 1, "", "MLPQ"]], 
"arlbench.core.algorithms.dqn.models.CNNQ": [[42, 4, 1, "", "__call__"], [42, 2, 1, "", "action_dim"], [42, 2, 1, "", "activation"], [42, 2, 1, "", "discrete"], [42, 2, 1, "", "hidden_size"], [42, 2, 1, "", "name"], [42, 2, 1, "", "parent"], [42, 2, 1, "", "scope"], [42, 4, 1, "", "setup"]], "arlbench.core.algorithms.dqn.models.MLPQ": [[42, 4, 1, "", "__call__"], [42, 2, 1, "", "action_dim"], [42, 2, 1, "", "activation"], [42, 2, 1, "", "discrete"], [42, 2, 1, "", "hidden_size"], [42, 2, 1, "", "name"], [42, 2, 1, "", "parent"], [42, 2, 1, "", "scope"], [42, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo": [[43, 1, 1, "", "PPO"], [43, 1, 1, "", "PPOMetrics"], [43, 1, 1, "", "PPORunnerState"], [43, 1, 1, "", "PPOState"], [43, 2, 1, "", "PPOTrainReturnT"], [43, 1, 1, "", "PPOTrainingResult"], [43, 0, 0, "-", "models"], [43, 0, 0, "-", "ppo"]], "arlbench.core.algorithms.ppo.PPO": [[43, 4, 1, "", "get_checkpoint_factory"], [43, 4, 1, "", "get_default_hpo_config"], [43, 4, 1, "", "get_default_nas_config"], [43, 4, 1, "", "get_hpo_config_space"], [43, 4, 1, "", "get_hpo_search_space"], [43, 4, 1, "", "get_nas_config_space"], [43, 4, 1, "", "init"], [43, 2, 1, "", "name"], [43, 4, 1, "", "predict"], [43, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.PPOMetrics": [[43, 2, 1, "", "advantages"], [43, 2, 1, "", "grads"], [43, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.PPORunnerState": [[43, 2, 1, "", "cur_rewards"], [43, 2, 1, "", "env_state"], [43, 2, 1, "", "global_step"], [43, 2, 1, "", "normalizer_state"], [43, 2, 1, "", "obs"], [43, 2, 1, "", "return_buffer"], [43, 2, 1, "", "return_buffer_idx"], [43, 2, 1, "", "rng"], [43, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.PPOState": [[43, 2, 1, "", "buffer_state"], [43, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.PPOTrainingResult": [[43, 2, 1, "", "eval_rewards"], [43, 2, 1, "", "metrics"], [43, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.models": [[43, 1, 1, "", 
"CNNActorCritic"], [43, 1, 1, "", "MLPActorCritic"]], "arlbench.core.algorithms.ppo.models.CNNActorCritic": [[43, 4, 1, "", "__call__"], [43, 2, 1, "", "action_dim"], [43, 2, 1, "", "activation"], [43, 2, 1, "", "discrete"], [43, 2, 1, "", "hidden_size"], [43, 2, 1, "", "name"], [43, 2, 1, "", "parent"], [43, 2, 1, "", "scope"], [43, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.models.MLPActorCritic": [[43, 4, 1, "", "__call__"], [43, 2, 1, "", "action_dim"], [43, 2, 1, "", "activation"], [43, 2, 1, "", "discrete"], [43, 2, 1, "", "hidden_size"], [43, 2, 1, "", "name"], [43, 2, 1, "", "parent"], [43, 2, 1, "", "scope"], [43, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.ppo": [[43, 1, 1, "", "PPO"], [43, 1, 1, "", "PPOMetrics"], [43, 1, 1, "", "PPORunnerState"], [43, 1, 1, "", "PPOState"], [43, 1, 1, "", "PPOTrainState"], [43, 1, 1, "", "PPOTrainingResult"], [43, 1, 1, "", "Transition"]], "arlbench.core.algorithms.ppo.ppo.PPO": [[43, 4, 1, "", "get_checkpoint_factory"], [43, 4, 1, "", "get_default_hpo_config"], [43, 4, 1, "", "get_default_nas_config"], [43, 4, 1, "", "get_hpo_config_space"], [43, 4, 1, "", "get_hpo_search_space"], [43, 4, 1, "", "get_nas_config_space"], [43, 4, 1, "", "init"], [43, 2, 1, "", "name"], [43, 4, 1, "", "predict"], [43, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.ppo.PPOMetrics": [[43, 2, 1, "", "advantages"], [43, 2, 1, "", "grads"], [43, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.ppo.PPORunnerState": [[43, 2, 1, "", "cur_rewards"], [43, 2, 1, "", "env_state"], [43, 2, 1, "", "global_step"], [43, 2, 1, "", "normalizer_state"], [43, 2, 1, "", "obs"], [43, 2, 1, "", "return_buffer"], [43, 2, 1, "", "return_buffer_idx"], [43, 2, 1, "", "rng"], [43, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.ppo.PPOState": [[43, 2, 1, "", "buffer_state"], [43, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainState": [[43, 4, 1, "", "create_with_opt_state"], [43, 2, 1, "", "opt_state"], [43, 4, 1, 
"", "replace"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult": [[43, 2, 1, "", "eval_rewards"], [43, 2, 1, "", "metrics"], [43, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.ppo.Transition": [[43, 2, 1, "", "action"], [43, 2, 1, "", "done"], [43, 2, 1, "", "info"], [43, 2, 1, "", "log_prob"], [43, 2, 1, "", "obs"], [43, 2, 1, "", "reward"], [43, 2, 1, "", "value"]], "arlbench.core.algorithms.prioritised_item_buffer": [[41, 5, 1, "", "create_prioritised_item_buffer"], [41, 5, 1, "", "make_prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[44, 1, 1, "", "SAC"], [44, 1, 1, "", "SACMetrics"], [44, 1, 1, "", "SACRunnerState"], [44, 1, 1, "", "SACState"], [44, 2, 1, "", "SACTrainReturnT"], [44, 1, 1, "", "SACTrainingResult"], [44, 0, 0, "-", "models"], [44, 0, 0, "-", "sac"]], "arlbench.core.algorithms.sac.SAC": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_actor"], [44, 4, 1, "", "update_alpha"], [44, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.SACMetrics": [[44, 2, 1, "", "actor_grads"], [44, 2, 1, "", "actor_loss"], [44, 2, 1, "", "alpha_loss"], [44, 2, 1, "", "critic_grads"], [44, 2, 1, "", "critic_loss"], [44, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.SACRunnerState": [[44, 2, 1, "", "actor_train_state"], [44, 2, 1, "", "alpha_train_state"], [44, 2, 1, "", "critic_train_state"], [44, 2, 1, "", "env_state"], [44, 2, 1, "", "global_step"], [44, 2, 1, "", "normalizer_state"], [44, 2, 1, "", "obs"], [44, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.SACState": [[44, 2, 1, "", "buffer_state"], [44, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.SACTrainingResult": [[44, 2, 1, "", 
"eval_rewards"], [44, 2, 1, "", "metrics"], [44, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.models": [[44, 1, 1, "", "AlphaCoef"], [44, 1, 1, "", "SACCNNActor"], [44, 1, 1, "", "SACCNNCritic"], [44, 1, 1, "", "SACMLPActor"], [44, 1, 1, "", "SACMLPCritic"], [44, 1, 1, "", "SACVectorCritic"], [44, 1, 1, "", "TanhTransformedDistribution"]], "arlbench.core.algorithms.sac.models.AlphaCoef": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "alpha_init"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNActor": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "log_std_max"], [44, 2, 1, "", "log_std_min"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNCritic": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPActor": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "log_std_max"], [44, 2, 1, "", "log_std_min"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPCritic": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"], [44, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACVectorCritic": [[44, 4, 1, "", "__call__"], [44, 2, 1, "", "action_dim"], [44, 2, 1, "", "activation"], [44, 2, 1, "", "critic"], [44, 2, 1, "", "hidden_size"], [44, 2, 1, "", 
"n_critics"], [44, 2, 1, "", "name"], [44, 2, 1, "", "parent"], [44, 2, 1, "", "scope"]], "arlbench.core.algorithms.sac.models.TanhTransformedDistribution": [[44, 4, 1, "", "mode"]], "arlbench.core.algorithms.sac.sac": [[44, 1, 1, "", "SAC"], [44, 1, 1, "", "SACMetrics"], [44, 1, 1, "", "SACRunnerState"], [44, 1, 1, "", "SACState"], [44, 1, 1, "", "SACTrainState"], [44, 1, 1, "", "SACTrainingResult"], [44, 1, 1, "", "Transition"]], "arlbench.core.algorithms.sac.sac.SAC": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_actor"], [44, 4, 1, "", "update_alpha"], [44, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.sac.SACMetrics": [[44, 2, 1, "", "actor_grads"], [44, 2, 1, "", "actor_loss"], [44, 2, 1, "", "alpha_loss"], [44, 2, 1, "", "critic_grads"], [44, 2, 1, "", "critic_loss"], [44, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.sac.SACRunnerState": [[44, 2, 1, "", "actor_train_state"], [44, 2, 1, "", "alpha_train_state"], [44, 2, 1, "", "critic_train_state"], [44, 2, 1, "", "env_state"], [44, 2, 1, "", "global_step"], [44, 2, 1, "", "normalizer_state"], [44, 2, 1, "", "obs"], [44, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.sac.SACState": [[44, 2, 1, "", "buffer_state"], [44, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.sac.SACTrainState": [[44, 4, 1, "", "create_with_opt_state"], [44, 2, 1, "", "network_state"], [44, 4, 1, "", "replace"], [44, 2, 1, "", "target_params"]], "arlbench.core.algorithms.sac.sac.SACTrainingResult": [[44, 2, 1, "", "eval_rewards"], [44, 2, 1, "", "metrics"], [44, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.sac.Transition": [[44, 2, 1, "", "action"], [44, 2, 1, "", 
"done"], [44, 2, 1, "", "info"], [44, 2, 1, "", "obs"], [44, 2, 1, "", "reward"], [44, 2, 1, "", "value"]], "arlbench.core.environments": [[45, 1, 1, "", "BraxEnv"], [45, 1, 1, "", "Environment"], [45, 1, 1, "", "EnvpoolEnv"], [45, 1, 1, "", "GymnasiumEnv"], [45, 1, 1, "", "GymnaxEnv"], [45, 0, 0, "-", "autorl_env"], [45, 0, 0, "-", "brax_env"], [45, 0, 0, "-", "envpool_env"], [45, 0, 0, "-", "gymnasium_env"], [45, 0, 0, "-", "gymnax_env"], [45, 5, 1, "", "make_env"], [45, 0, 0, "-", "make_env"], [45, 0, 0, "-", "xland_env"]], "arlbench.core.environments.BraxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.Environment": [[45, 4, 1, "", "action_space"], [45, 3, 1, "", "env_name"], [45, 3, 1, "", "n_envs"], [45, 4, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_actions"], [45, 4, 1, "", "step"]], "arlbench.core.environments.EnvpoolEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.GymnasiumEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.GymnaxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_action"], [45, 4, 1, "", "step"]], "arlbench.core.environments.autorl_env": [[45, 1, 1, "", "Environment"]], "arlbench.core.environments.autorl_env.Environment": [[45, 4, 1, "", "action_space"], [45, 3, 1, "", "env_name"], [45, 3, 1, "", "n_envs"], [45, 4, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_actions"], [45, 4, 1, "", "step"]], "arlbench.core.environments.brax_env": [[45, 1, 1, "", "BraxEnv"]], "arlbench.core.environments.brax_env.BraxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", 
"reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.envpool_env": [[45, 1, 1, "", "EnvpoolEnv"], [45, 5, 1, "", "numpy_to_jax"]], "arlbench.core.environments.envpool_env.EnvpoolEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.gymnasium_env": [[45, 1, 1, "", "GymnasiumEnv"]], "arlbench.core.environments.gymnasium_env.GymnasiumEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "step"]], "arlbench.core.environments.gymnax_env": [[45, 1, 1, "", "GymnaxEnv"]], "arlbench.core.environments.gymnax_env.GymnaxEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_action"], [45, 4, 1, "", "step"]], "arlbench.core.environments.make_env": [[45, 5, 1, "", "make_env"]], "arlbench.core.environments.xland_env": [[45, 1, 1, "", "XLandEnv"]], "arlbench.core.environments.xland_env.XLandEnv": [[45, 3, 1, "", "action_space"], [45, 3, 1, "", "observation_space"], [45, 4, 1, "", "reset"], [45, 4, 1, "", "sample_action"], [45, 4, 1, "", "step"]], "arlbench.core.running_statistics": [[40, 1, 1, "", "NestedMeanStd"], [40, 1, 1, "", "RunningStatisticsState"], [40, 5, 1, "", "denormalize"], [40, 5, 1, "", "init_state"], [40, 5, 1, "", "normalize"], [40, 5, 1, "", "update"]], "arlbench.core.running_statistics.NestedMeanStd": [[40, 2, 1, "", "mean"], [40, 4, 1, "", "replace"], [40, 2, 1, "", "std"]], "arlbench.core.running_statistics.RunningStatisticsState": [[40, 2, 1, "", "count"], [40, 4, 1, "", "replace"], [40, 2, 1, "", "summed_variance"]], "arlbench.core.wrappers": [[46, 1, 1, "", "FlattenObservationWrapper"], [46, 1, 1, "", "Wrapper"], [46, 0, 0, "-", "flatten_observation"], [46, 0, 0, "-", "wrapper"]], "arlbench.core.wrappers.FlattenObservationWrapper": [[46, 3, 1, "", "observation_space"], [46, 4, 1, "", "reset"], [46, 4, 1, "", "step"]], 
"arlbench.core.wrappers.flatten_observation": [[46, 1, 1, "", "FlattenObservationWrapper"]], "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper": [[46, 3, 1, "", "observation_space"], [46, 4, 1, "", "reset"], [46, 4, 1, "", "step"]], "arlbench.core.wrappers.wrapper": [[46, 1, 1, "", "Wrapper"]], "arlbench.utils": [[47, 0, 0, "-", "common"], [47, 5, 1, "", "config_space_to_gymnasium_space"], [47, 5, 1, "", "config_space_to_yaml"], [47, 5, 1, "", "gymnasium_space_to_gymnax_space"], [47, 5, 1, "", "recursive_concat"], [47, 5, 1, "", "save_defaults_to_yaml"], [47, 5, 1, "", "tuple_concat"]], "arlbench.utils.common": [[47, 5, 1, "", "config_space_to_gymnasium_space"], [47, 5, 1, "", "config_space_to_yaml"], [47, 5, 1, "", "gymnasium_space_to_gymnax_space"], [47, 5, 1, "", "recursive_concat"], [47, 5, 1, "", "save_defaults_to_yaml"], [47, 5, 1, "", "tuple_concat"]]}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "attribute", "Python attribute"], "3": ["py", "property", "Python property"], "4": ["py", "method", "Python method"], "5": ["py", "function", "Python function"]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:attribute", "3": "py:property", "4": "py:method", "5": "py:function"}, "terms": {"": [2, 3, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 38, 41, 42, 43, 44, 49], "0": [14, 15, 17, 19, 20, 21, 22, 23, 24, 30, 32, 36, 37, 39, 40, 41, 42, 43, 44, 45, 47], "06": [32, 40], "1": [14, 15, 17, 19, 21, 22, 23, 24, 30, 39, 42, 43, 44, 45, 49], "10": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "100": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "1000000": [10, 11, 14, 15, 17, 19, 21, 23, 32, 40, 41, 42, 43, 44], "1e": [32, 40], "2": [14, 15, 17, 19, 21, 22, 23, 32, 39, 40, 42, 43, 44, 49], "20": [22, 44], "24": [32, 40], "3": [14, 15, 17, 19, 21, 23, 42, 43, 44], "31": [32, 40], "4": [14, 15, 17, 19, 21, 23, 42, 43, 44], "5": [14, 15, 17, 19, 21, 23, 42, 43, 44], "512": 
[16, 18, 22, 42, 43, 44], "6": [17, 19, 20, 21, 23, 41, 43, 44], "64": [16, 18, 22, 42, 43, 44], "64bit": [32, 40], "7": [17, 19, 21, 23, 43, 44], "8": [17, 19, 43], "A": [13, 16, 18, 22, 24, 26, 28, 29, 31, 32, 40, 41, 42, 43, 44, 45, 52], "As": [17, 19, 24, 25, 43, 45], "If": [2, 4, 5, 20, 32, 38, 39, 40, 41], "In": [2, 4, 5, 38, 39], "It": [7, 8, 39, 51], "Not": [10, 14, 15, 21, 23, 41, 42, 44], "The": [6, 10, 11, 16, 18, 20, 22, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 51, 52], "These": [24, 25, 45], "To": [32, 40], "With": [2, 4, 5, 38, 39], "_": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44, 45], "__call__": [7, 8, 16, 18, 22, 38, 39, 41, 42, 43, 44], "__init__": [16, 18, 22, 42, 43, 44], "__lt__": [7, 38, 39], "__new__": [7, 8, 38, 39], "__setattr__": [16, 18, 22, 42, 43, 44], "_description_": [2, 4, 5, 10, 21, 23, 24, 25, 30, 36, 37, 38, 39, 41, 44, 45, 47], "_imag": [32, 40], "_sentinel": [16, 18, 22, 42, 43, 44], "_summary_": [10, 21, 23, 41, 44], "_type_": [36, 37, 47], "abc": [7, 8, 10, 11, 24, 25, 39, 41, 45], "abstract": [7, 8, 10, 11, 24, 25, 39, 41, 45], "access": [16, 18, 22, 42, 43, 44], "accumul": [32, 40], "acm": [32, 40], "across": [17, 19, 43], "act": [20, 41], "action": [2, 4, 5, 10, 11, 13, 14, 15, 17, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46], "action_dim": [16, 18, 22, 41, 42, 43, 44], "action_s": [10, 11, 41], "action_spac": [2, 4, 5, 24, 25, 26, 27, 28, 29, 31, 38, 39, 40, 45, 55], "action_typ": [10, 11, 40, 41], "activ": [16, 18, 22, 41, 42, 43, 44], "actor": [10, 18, 21, 22, 23, 41, 43, 44, 52], "actor_grad": [21, 23, 41, 44], "actor_loss": [10, 21, 23, 41, 44], "actor_network_param": [10, 21, 23, 41, 44], "actor_opt_st": [10, 21, 23, 41, 44], "actor_train_st": [10, 21, 23, 41, 44], "actual": [24, 25, 45, 51], "ad": [20, 41], "adapt": [10, 11, 12, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "add": [20, 41], "add_batch": [20, 41], "add_sequ": [20, 41], 
"addit": [2, 4, 5, 38, 39], "advantag": [7, 8, 17, 19, 39, 41, 43], "after": [32, 40], "agent": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "algorithm": [2, 4, 5, 6, 24, 25, 36, 37, 38, 39, 40, 45, 47, 52, 55], "algorithm_kw_arg": [6, 39], "algorithm_st": [6, 10, 11, 39, 41], "algorithmst": [6, 39], "alia": [14, 15, 17, 19, 21, 23, 42, 43, 44], "all": [6, 10, 11, 14, 15, 17, 19, 21, 23, 32, 39, 40, 41, 42, 43, 44], "allow": [7, 8, 39], "alpha": [10, 20, 21, 22, 23, 41, 44], "alpha_init": [22, 41, 44], "alpha_loss": [10, 21, 23, 41, 44], "alpha_network_param": [10, 21, 23, 41, 44], "alpha_opt_st": [10, 21, 23, 41, 44], "alpha_train_st": [10, 21, 23, 41, 44], "alphacoef": [22, 41, 44], "also": 51, "alwai": [17, 19, 43, 51], "among": [10, 11, 41], "an": [6, 7, 8, 13, 16, 18, 20, 22, 24, 25, 27, 32, 39, 40, 41, 42, 43, 44, 45, 49, 52], "ani": [6, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 30, 32, 33, 34, 39, 40, 41, 42, 43, 44, 45, 46], "anoth": [16, 18, 22, 42, 43, 44, 49], "append": [6, 39], "appli": [16, 18, 22, 42, 43, 44, 52], "apply_fn": [15, 19, 23, 42, 43, 44], "approxim": 52, "ar": [6, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 32, 33, 34, 39, 40, 41, 42, 43, 44, 46, 51], "architectur": [10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 41, 42, 43, 44, 47], "arg": [7, 8, 22, 39, 44], "argument": [24, 30, 45], "arlbench": 51, "around": [7, 8, 39], "arrai": [2, 4, 5, 14, 15, 17, 19, 21, 22, 23, 24, 25, 27, 32, 38, 39, 40, 41, 42, 43, 44, 45], "assign": [16, 18, 22, 42, 43, 44], "attribut": [6, 16, 18, 22, 39, 42, 43, 44], "autom": [2, 4, 5, 38, 39, 52], "automl": [49, 52], "autorl": [2, 38, 52, 55], "autorl_config": [6, 39], "autorl_env": [38, 40, 55], "autorlenv": [2, 4, 5, 38, 39, 55], "axi": [32, 36, 37, 40, 47], "base": [2, 4, 5, 6, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 44, 45, 46], "baselines3": [18, 22, 43, 44], "basic": [7, 8, 10, 11, 39, 41], 
"batch": [10, 12, 14, 15, 20, 21, 23, 32, 40, 41, 42, 44], "batch_siz": [12, 41], "bayesian": 52, "befor": [2, 4, 5, 16, 18, 22, 32, 38, 39, 40, 42, 43, 44], "behaviour": [7, 8, 39], "being": [16, 18, 20, 22, 41, 42, 43, 44], "best": 52, "between": [7, 12, 39, 41], "black": 52, "blob": [18, 22, 32, 40, 43, 44], "bo": [49, 52], "bool": [2, 4, 5, 6, 7, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 32, 38, 39, 40, 41, 42, 43, 44, 45], "bool_": [17, 19, 21, 23, 41, 43, 44, 45], "both": [24, 25, 45], "bound": [16, 18, 22, 42, 43, 44], "box": [33, 34, 46, 52], "branch": 51, "brax": [24, 26, 30, 45], "brax_env": [38, 40], "braxenv": [24, 26, 40, 45], "buffer": [6, 10, 11, 14, 15, 17, 19, 20, 38, 39, 40, 42, 43], "buffer_dir": [6, 39], "buffer_st": [6, 10, 11, 14, 15, 17, 19, 21, 23, 39, 41, 42, 43, 44], "c_episod": [6, 39], "c_step": [6, 39], "calcul": [7, 8, 22, 39, 44], "call": [2, 4, 5, 7, 8, 16, 18, 20, 22, 33, 34, 38, 39, 41, 42, 43, 44, 46], "callabl": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "can": [7, 8, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 39, 41, 42, 43, 44, 51, 52], "captur": [13, 41], "carbon": [7, 39], "case": [16, 18, 22, 42, 43, 44], "caus": [16, 18, 22, 42, 43, 44], "caution": 51, "certain": [6, 39], "cfg": [2, 3, 38], "checkpoint": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 41, 42, 43, 44, 55], "checkpoint_dir": [6, 39], "checkpoint_nam": [6, 39], "checkpoint_path": [2, 4, 5, 6, 38, 39], "chex": [10, 11, 12, 14, 15, 17, 19, 21, 23, 33, 34, 41, 42, 43, 44, 46], "chosen": [20, 41], "cl": [7, 8, 39], "class": [2, 4, 5, 6, 7, 8, 10, 11, 13, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 31, 32, 33, 34, 35, 38, 39, 40, 41, 42, 43, 44, 45, 46], "classmethod": [42, 43, 44], "clear": 51, "clearli": 51, "clip": 52, "cnn": [16, 18, 22, 42, 43, 44], "cnn_polici": [10, 14, 15, 17, 19, 21, 23, 24, 30, 31, 41, 42, 43, 44, 45], "cnnactorcrit": [18, 41, 43], "cnnq": [16, 41, 42], "code": [7, 39, 49, 51], "coeffici": [22, 44], "com": [18, 22, 
32, 40, 43, 44], "common": [6, 18, 22, 38, 39, 40, 43, 44, 55], "common_gotchas_in_jax": [32, 40], "compact": [16, 18, 22, 42, 43, 44], "compar": [7, 39], "comparison": [7, 39, 51], "compat": [24, 30, 45], "comput": [32, 40], "concat": [36, 37, 47], "concaten": [36, 37, 47], "config": [2, 3, 4, 5, 38, 39, 55], "config_kei": [36, 37, 47], "config_spac": [2, 4, 5, 36, 37, 38, 39, 47, 55], "config_space_to_gymnasium_spac": [36, 37, 38, 47], "config_space_to_yaml": [36, 37, 38, 47], "configspac": [2, 4, 5, 36, 37, 38, 39, 47], "configur": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 38, 39, 41, 42, 43, 44, 47], "configurationspac": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 38, 39, 41, 42, 43, 44, 47], "consid": [32, 40], "consist": [14, 15, 17, 19, 21, 23, 42, 43, 44], "construct": [0, 16, 18, 22, 42, 43, 44, 48, 54], "contain": [6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 32, 39, 40, 41, 42, 43, 44, 45], "content": 55, "conv": [16, 18, 22, 42, 43, 44], "conv1": [16, 18, 22, 42, 43, 44], "converst": [36, 37, 47], "convert": [27, 36, 37, 45, 47], "core": [38, 39, 55], "correctli": 51, "correspond": [32, 40], "count": [32, 38, 40], "cpu": [20, 41], "creat": [2, 4, 5, 7, 8, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 38, 39, 41, 42, 43, 44, 45], "create_prioritised_item_buff": [20, 40, 41], "create_with_opt_st": [41, 42, 43, 44], "critic": [10, 18, 21, 22, 23, 41, 43, 44, 52], "critic_grad": [21, 23, 41, 44], "critic_loss": [10, 21, 23, 41, 44], "critic_network_param": [10, 21, 23, 41, 44], "critic_opt_st": [10, 21, 23, 41, 44], "critic_target_param": [10, 21, 23, 41, 44], "critic_train_st": [10, 21, 23, 41, 44], "cumul": [10, 11, 41], "cur_reward": [17, 19, 41, 43], "current": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "d": [13, 41], "data": [6, 20, 32, 39, 40, 41], "deep": [10, 14, 15, 41, 42, 52], "deepmind": [32, 40], "def": [16, 18, 22, 42, 43, 44], "default": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 32, 
36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47], "defin": [10, 11, 16, 18, 22, 41, 42, 43, 44, 51], "degrad": [32, 40], "denorm": [32, 38, 40], "depend": [20, 32, 40, 41], "determinist": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "deterministic_ev": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "deviat": [7, 32, 39, 40], "devic": [20, 41], "dict": [2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 24, 30, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47], "dict1": [36, 37, 47], "dict2": [36, 37, 47], "dictionari": [6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 39, 41, 42, 43, 44, 47], "differ": [10, 11, 41, 51, 52], "dimens": [32, 40], "directli": [7, 8, 39], "directori": [6, 39], "discret": [10, 11, 16, 18, 41, 42, 43], "disk": [6, 39], "distrax": [22, 44], "distribut": [22, 44], "dlr": [18, 22, 43, 44], "do": [7, 8, 39, 51], "doc": [32, 40], "doe": [16, 17, 18, 19, 22, 42, 43, 44], "doesn": [32, 40], "dolor": 53, "done": [6, 7, 8, 10, 13, 14, 15, 19, 23, 39, 40, 41, 42, 43, 44, 52], "doubl": [32, 40], "dqn": [10, 21, 23, 38, 39, 40, 41, 44, 52], "dqnmetric": [14, 15, 41, 42], "dqnrunnerst": [10, 14, 15, 41, 42], "dqnstate": [10, 14, 15, 41, 42], "dqntrainingresult": [10, 14, 15, 41, 42], "dqntrainreturnt": [10, 14, 15, 41, 42], "dqntrainstat": [10, 14, 15, 41, 42], "dtype": [32, 40], "dummi": [6, 39], "dummy_buffer_st": [6, 39], "dure": [2, 4, 5, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "dynam": [32, 40], "each": [2, 4, 5, 20, 24, 25, 38, 39, 41, 45], "earlier": [32, 40], "either": [16, 18, 22, 42, 43, 44], "element": [32, 36, 37, 40, 47], "emiss": [7, 38, 39], "empti": [2, 4, 5, 38, 39], "en": [32, 40], "enabl": [32, 40, 51], "entropi": [10, 21, 23, 41, 44, 52], "env": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 35, 38, 39, 41, 42, 43, 44, 45, 46], "env_framework": [24, 30, 45], "env_kwarg": [24, 26, 27, 28, 29, 30, 31, 45], "env_nam": [24, 25, 26, 27, 28, 29, 30, 31, 40, 45], "env_stat": [14, 15, 17, 19, 21, 23, 
24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "environ": [2, 4, 5, 6, 7, 8, 10, 11, 13, 33, 34, 38, 39, 40, 41, 46, 51, 52], "envpool": [24, 27, 30, 45], "envpool_env": [38, 40], "envpoolenv": [24, 27, 40, 45], "episod": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "equival": [20, 24, 30, 32, 40, 41, 45], "error": [2, 4, 5, 38, 39], "etc": [24, 30, 32, 40, 45], "eval": [2, 4, 5, 10, 11, 38, 39, 40, 41, 55], "eval_env": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "eval_reward": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "evalu": [2, 4, 5, 7, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "evalut": [2, 4, 5, 38, 39], "even": [32, 40], "exisit": 51, "experi": [10, 12, 21, 23, 41, 44, 51], "exploit": 52, "explor": 52, "expon": [20, 41], "extract": [36, 37, 47], "facilit": 51, "factori": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "fals": [10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 31, 41, 42, 43, 44, 45], "featur": [2, 4, 5, 8, 38, 39], "fidel": 52, "field": [14, 15, 17, 19, 21, 23, 32, 40, 42, 43, 44], "file": [32, 36, 37, 40, 47], "final": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "find": [51, 52], "first": [7, 8, 36, 37, 39, 47], "fit": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "flatten": [33, 34, 46], "flatten_observ": [38, 40], "flattenobservationwrapp": [33, 34, 40, 46], "flax": [16, 18, 22, 42, 43, 44], "float": [2, 3, 20, 32, 38, 40, 41, 44], "float32": [32, 40], "follow": [16, 18, 22, 24, 25, 30, 42, 43, 44, 45], "found": 51, "framework": [24, 30, 45, 51], "free": 51, "from": [6, 32, 39, 40, 52], "from_tupl": [40, 41], "frozendict": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "full": [32, 40], "fulli": [24, 25, 45], "function": [3, 7, 8, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 27, 32, 33, 34, 37, 39, 40, 41, 42, 43, 44, 45, 46, 52], "gener": [10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "get_checkpoint_factori": [10, 11, 14, 15, 17, 19, 21, 23, 40, 
41, 42, 43, 44], "get_default_hpo_config": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_default_nas_config": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_hpo_config_spac": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_hpo_search_spac": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_nas_config_spac": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "get_spec": [7, 38, 39], "get_state_spac": [8, 38, 39], "github": [18, 22, 32, 40, 43, 44], "give": [16, 18, 22, 42, 43, 44], "given": [2, 3, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 32, 33, 34, 38, 40, 41, 42, 43, 44, 45, 46, 52], "global_step": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "glossari": 49, "gpu": [20, 41], "grad": [8, 10, 14, 15, 17, 19, 39, 41, 42, 43], "grad_info": 39, "gradient": [8, 39, 52], "gradinfo": [8, 38, 39], "gymnasium": [2, 4, 5, 24, 25, 28, 30, 36, 37, 38, 39, 45, 47, 51], "gymnasium_env": [38, 40], "gymnasium_space_to_gymnax_spac": [36, 37, 38, 47], "gymnasiumenv": [24, 28, 40, 45], "gymnax": [24, 25, 26, 27, 28, 29, 30, 31, 36, 37, 45, 47], "gymnax_env": [38, 40], "gymnax_spac": [36, 37, 47], "gymnaxenv": [24, 29, 40, 45], "gynasium": [2, 4, 5, 38, 39], "gynmasium": [2, 4, 5, 38, 39], "ha": [24, 30, 45], "happen": [16, 18, 22, 42, 43, 44], "have": [32, 40, 51], "hello": 49, "here": [16, 18, 22, 42, 43, 44, 49], "hidden_s": [16, 18, 22, 41, 42, 43, 44], "hierarchi": [32, 40], "howev": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44, 51], "hp_config": [6, 36, 37, 39, 47], "hp_config_spac": [36, 37, 47], "hpo": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44, 52], "hpo_config": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44, 55], "html": [32, 40], "http": [18, 22, 32, 40, 43, 44, 49], "hyperparamet": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 38, 39, 41, 42, 43, 44, 47, 52], "i": [0, 2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 38, 39, 41, 42, 43, 44, 48, 49, 51, 54], "id": [6, 
24, 25, 30, 39, 45], "ideal": 51, "identifi": [6, 39], "imit": [7, 8, 39], "immedi": [16, 18, 22, 42, 43, 44], "impact": [32, 40], "implement": [7, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 39, 41, 42, 43, 44, 45], "improv": [32, 40, 52], "includ": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "independ": [20, 41], "inexact": [32, 40], "info": [15, 19, 23, 41, 42, 43, 44], "inform": [2, 4, 5, 8, 38, 39], "infot": [2, 4, 5, 38, 39], "init": [10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 40, 41, 42, 43, 44], "init_and_output": [16, 18, 22, 42, 43, 44], "init_st": [32, 38, 40], "initi": [2, 4, 5, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 32, 38, 39, 40, 41, 42, 43, 44], "insid": [16, 18, 22, 42, 43, 44], "instal": 49, "instanc": [7, 8, 16, 18, 22, 39, 42, 43, 44], "int": [2, 4, 5, 6, 10, 11, 12, 14, 15, 17, 19, 20, 21, 23, 24, 25, 30, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47], "int32": [32, 40], "integ": [32, 40], "interact": [13, 41], "intern": [24, 25, 33, 34, 45, 46], "interv": [12, 41], "invok": [16, 18, 22, 42, 43, 44], "io": [32, 40], "ipsum": 53, "is_weight": [10, 14, 15, 21, 23, 41, 42, 44], "item": [13, 20, 40, 41, 49], "iter": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "its": [2, 4, 5, 33, 34, 38, 39, 46, 52], "jax": [10, 14, 15, 17, 19, 21, 23, 24, 25, 27, 30, 32, 40, 41, 42, 43, 44, 45], "jax_enable_x64": [32, 40], "jit": [32, 40, 51], "jittabl": [24, 25, 45], "jnp": [10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 32, 33, 34, 40, 41, 42, 43, 44, 45, 46], "json": 39, "keep": [7, 8, 39], "kei": [10, 11, 12, 13, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "kept": [17, 19, 43], "keyword": [24, 30, 45], "kind": [24, 25, 45], "know": [6, 39], "kwarg": [7, 8, 22, 39, 41, 42, 43, 44], "l48": [18, 22, 43, 44], "larg": [32, 40], "last": [6, 7, 39], "last_ob": [13, 40, 41], "latest": [32, 40], "lazi": [16, 18, 22, 42, 43, 44], "lazili": [16, 18, 22, 42, 43, 44], "learn": [2, 4, 5, 10, 11, 38, 39, 41, 52], 
"leav": [32, 40], "length": [12, 20, 41], "less": [7, 39], "let": 49, "level": [2, 38, 52], "like": [2, 4, 5, 13, 16, 18, 22, 38, 39, 41, 42, 43, 44], "line": [16, 18, 22, 42, 43, 44], "linen": [16, 18, 22, 42, 43, 44], "link": 49, "list": [2, 3, 4, 5, 38, 39, 49], "load": [6, 38, 39], "load_buff": [6, 38, 39], "log_prob": [19, 41, 43], "log_std_max": [22, 41, 44], "log_std_min": [22, 41, 44], "logger": [2, 3, 38], "lorem": 53, "loss": [10, 14, 15, 17, 19, 41, 42, 43], "machin": 52, "make": [20, 41], "make_env": [24, 38, 40], "make_prioritised_item_buff": [20, 40, 41], "mani": 51, "map": [13, 41], "master": [18, 22, 32, 40, 43, 44], "match": [24, 30, 32, 40, 45], "max_abs_valu": [32, 40], "max_length": [20, 41], "max_recorded_prior": 39, "maxim": [7, 39], "maximum": [20, 32, 40, 41, 52], "mean": [7, 32, 38, 39, 40], "mean_std": [32, 40], "measur": [7, 39], "method": [6, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 39, 41, 42, 43, 44, 45, 52], "metric": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "min_length": [20, 41], "minim": [7, 39], "minimum": [20, 32, 40, 41, 52], "mlp": [16, 18, 22, 42, 43, 44], "mlpactorcrit": [18, 41, 43], "mlpq": [16, 41, 42], "mode": [22, 41, 44, 49], "model": [40, 41, 52], "modifi": [32, 40], "modul": [2, 4, 9, 10, 14, 16, 17, 18, 21, 22, 24, 33, 36, 55], "more": [20, 41], "mrp_file": [38, 39], "multi": 52, "multipl": 52, "must": [24, 30, 32, 40, 45], "mymodul": [16, 18, 22, 42, 43, 44], "n_critic": [22, 41, 44], "n_env": [10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 26, 27, 29, 30, 31, 40, 41, 42, 43, 44, 45], "n_eval_episod": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "n_eval_step": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "n_total_timestep": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "name": [6, 16, 18, 22, 24, 25, 30, 32, 36, 37, 39, 40, 41, 42, 43, 44, 45, 47], "namedtupl": [14, 15, 17, 19, 21, 23, 42, 43, 44], "nas_config": [10, 11, 14, 15, 17, 19, 21, 23, 
41, 42, 43, 44], "nas_config_sapc": [36, 37, 47], "naturecnn": [18, 22, 43, 44], "ndarrai": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46], "need": [24, 25, 45], "nest": [32, 40], "nestedmeanstd": [32, 38, 40], "network": [10, 14, 15, 16, 17, 18, 19, 21, 22, 23, 41, 42, 43, 44, 52], "network_param": [10, 14, 15, 17, 19, 41, 42, 43], "network_st": [41, 44], "neural": [10, 11, 14, 15, 17, 19, 21, 23, 36, 37, 41, 42, 43, 44, 47, 52], "new": [7, 8, 15, 19, 23, 32, 39, 40, 42, 43, 44], "next": [10, 14, 15, 41, 42], "next_observ": [10, 14, 15, 41, 42], "nn": [16, 18, 22, 42, 43, 44], "node": 39, "nodes_fil": [38, 39], "none": [2, 3, 4, 5, 6, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47], "norm": [8, 39], "normal": [32, 38, 40], "normalizer_st": [14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "note": [17, 19, 24, 25, 32, 40, 43, 45, 49], "notebook": [32, 40], "now": [16, 18, 22, 42, 43, 44], "np": [2, 4, 5, 38, 39], "npy": 39, "num_eval_episod": [2, 4, 5, 10, 11, 38, 39, 41], "number": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 30, 33, 34, 38, 39, 41, 42, 43, 44, 45, 46], "numpi": [27, 32, 40, 45], "numpy_to_jax": [27, 40, 45], "ob": [10, 11, 13, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "object": [2, 3, 4, 5, 6, 8, 13, 15, 16, 18, 19, 22, 23, 32, 33, 35, 36, 37, 38, 40, 41, 42, 43, 44, 46, 47, 52, 55], "objectivest": [2, 4, 5, 38, 39], "objectv": [7, 39], "obser": [33, 34, 46], "observ": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 41, 42, 43, 44, 45, 46], "observation_spac": [2, 4, 5, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 40, 45, 46, 55], "observationt": [2, 4, 5, 38, 39], "off": 52, "onc": [16, 18, 22, 42, 43, 44], "one": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 30, 38, 39, 41, 42, 43, 44, 45], "ones": 51, "onli": [17, 19, 32, 40, 43], "oper": [20, 41], "opt_stat": [10, 14, 15, 17, 
19, 23, 41, 42, 43, 44], "optax": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "optim": [7, 10, 14, 15, 17, 19, 20, 21, 23, 39, 41, 42, 43, 44, 52], "optimize_object": [7, 39], "option": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47], "optstat": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "order": 49, "org": [32, 40, 49], "other": [7, 10, 14, 15, 16, 17, 18, 19, 21, 22, 23, 39, 41, 42, 43, 44], "output": 49, "overflow": [32, 40], "overrid": [7, 8, 39], "overriden": [6, 39], "own": 51, "packag": [2, 55], "page": [0, 48, 49, 54], "paper": [20, 41, 51], "param": [10, 14, 15, 17, 19, 23, 41, 42, 43, 44], "paramet": [2, 4, 5, 6, 7, 8, 10, 11, 12, 14, 15, 17, 19, 20, 21, 23, 24, 25, 30, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "parent": [16, 18, 22, 41, 42, 43, 44], "part": [6, 39], "pass": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 30, 32, 38, 39, 40, 41, 42, 43, 44, 45], "path": [2, 4, 5, 6, 38, 39], "per": [2, 4, 5, 10, 11, 14, 15, 17, 19, 20, 21, 23, 38, 39, 41, 42, 43, 44], "perform": [2, 4, 5, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 25, 32, 38, 39, 40, 41, 42, 43, 44, 45], "period": [12, 41], "pmap": [32, 40], "pmap_axis_nam": [32, 40], "png": [32, 40], "point": [32, 40], "polici": [10, 17, 19, 41, 43, 52], "possibl": [10, 11, 41], "possibli": [32, 40], "posssibl": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "ppo": [10, 21, 22, 23, 38, 39, 40, 41, 44, 52], "ppometr": [17, 19, 41, 43], "pporunnerst": [10, 17, 19, 41, 43], "ppostat": [10, 17, 19, 41, 43], "ppotrainingresult": [10, 17, 19, 41, 43], "ppotrainreturnt": [10, 17, 19, 41, 43], "ppotrainst": [17, 19, 41, 43], "precis": [32, 40], "predefin": 52, "predict": [10, 11, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "principl": 52, "print": 49, "prioriti": [6, 20, 39, 41], "prioritis": [20, 41], "prioritised_item_buff": [38, 40], "prioritisedtrajectorybuff": [20, 41], "prioritisedtrajectorybufferst": [6, 10, 12, 14, 15, 21, 23, 39, 
41, 42, 44], "priority_expon": [20, 41], "priority_state_path": [6, 39], "prioriz": [12, 41], "prngkei": [10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "problem": 52, "proce": 51, "process": 52, "product": 49, "properti": [2, 4, 5, 10, 11, 24, 25, 26, 27, 28, 29, 31, 33, 34, 38, 39, 41, 45, 46], "provid": [13, 41, 51], "proxim": [10, 17, 19, 41, 43, 52], "py": [18, 22, 32, 40, 43, 44], "q": [10, 14, 15, 16, 41, 42, 52], "rais": [2, 4, 5, 38, 39], "random": [2, 4, 5, 10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 30, 33, 34, 38, 39, 41, 42, 43, 44, 45, 46, 52], "randomli": 52, "rang": [32, 40], "rank": [7, 38, 39], "re": [2, 4, 5, 38, 39, 51], "readthedoc": [32, 40], "real": 52, "recurs": [36, 37, 47], "recursive_concat": [36, 37, 38, 47], "refer": 49, "reinforc": [2, 4, 5, 10, 11, 38, 39, 41, 52], "relat": [6, 39], "remov": 49, "replac": [15, 19, 23, 32, 38, 40, 41, 42, 43, 44], "repo": 51, "report": 51, "requir": [6, 39], "reset": [2, 4, 5, 24, 25, 33, 34, 38, 39, 40, 45, 46, 55], "restor": [6, 39], "result": [6, 10, 11, 14, 15, 17, 19, 21, 23, 32, 33, 34, 39, 40, 41, 42, 43, 44, 46, 51], "return": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 14, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "return_buff": [17, 19, 41, 43], "return_buffer_idx": [17, 19, 41, 43], "reward": [7, 10, 11, 13, 14, 15, 19, 23, 39, 40, 41, 42, 43, 44], "reward_mean": 39, "reward_std": 39, "rewardmean": [7, 38, 39], "rewardstd": [7, 38, 39], "rl": [2, 4, 5, 24, 25, 26, 27, 28, 29, 30, 31, 38, 39, 45], "rm": [18, 22, 43, 44], "rng": [10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 41, 42, 43, 44, 45, 46], "rng_kei": [12, 41], "run": [2, 3, 4, 5, 32, 38, 39, 40], "run_arlbench": [2, 3, 38, 55], "runner": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "runner_st": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "running_statist": [38, 55], "runningstatisticsst": [14, 15, 17, 19, 21, 23, 32, 38, 
40, 42, 43, 44], "runtim": [7, 38, 39], "sac": [10, 38, 39, 40, 41, 52], "saccnnactor": [22, 41, 44], "saccnncrit": [22, 41, 44], "sacmetr": [21, 23, 41, 44], "sacmlpactor": [22, 41, 44], "sacmlpcrit": [22, 41, 44], "sacrunnerst": [10, 21, 23, 41, 44], "sacstat": [10, 21, 23, 41, 44], "sactrainingresult": [10, 21, 23, 41, 44], "sactrainreturnt": [10, 21, 23, 41, 44], "sactrainst": [10, 21, 23, 41, 44], "sacvectorcrit": [22, 41, 44], "safe": [16, 18, 22, 42, 43, 44], "same": [32, 36, 37, 40, 47], "sampl": [10, 11, 12, 14, 15, 17, 19, 20, 21, 23, 24, 25, 41, 42, 43, 44, 45, 52], "sample_act": [24, 25, 40, 45], "sample_batch_s": [20, 41], "save": [6, 38, 39], "save_buff": [6, 38, 39], "save_defaults_to_yaml": [36, 37, 38, 47], "scalar": 39, "scalars_fil": [38, 39], "scope": [41, 42, 43, 44], "search": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44, 51, 52], "second": [36, 37, 47], "see": [16, 18, 22, 32, 40, 42, 43, 44], "seed": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 27, 28, 30, 36, 37, 38, 39, 41, 42, 43, 44, 45, 47], "self": [7, 8, 16, 18, 22, 39, 42, 43, 44], "sequenc": [12, 20, 41], "sequence_length": [12, 41], "set": [13, 32, 40, 41], "setup": [16, 18, 22, 41, 42, 43, 44], "shape": [10, 11, 32, 40, 41], "share": [10, 11, 41], "should": [32, 40, 51], "similar": [16, 18, 22, 42, 43, 44], "simplifi": [32, 40], "singl": [6, 20, 39, 41], "size": [6, 10, 11, 12, 20, 39, 41], "so": 51, "soft": [10, 21, 23, 41, 44, 52], "some": 49, "sort": [7, 39], "sourc": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "space": [2, 4, 5, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 26, 27, 28, 29, 31, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47, 51, 52], "specif": [7, 8, 39], "specifi": [15, 19, 23, 32, 40, 42, 43, 44], "stabil": 52, "stabl": [18, 22, 32, 40, 43, 44], "stable_baselines3": [18, 22, 43, 44], "standard": [7, 32, 39, 40], "state": [2, 
4, 5, 6, 8, 10, 11, 12, 14, 15, 17, 19, 21, 23, 24, 25, 32, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46, 51], "state_featur": [38, 55], "statefeatur": [8, 38, 39], "static": [6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 39, 41, 42, 43, 44], "statist": [32, 40], "std": [32, 38, 40], "std_max_valu": [32, 40], "std_min_valu": [32, 40], "step": [2, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 38, 39, 40, 41, 42, 43, 44, 45, 46, 49, 55], "store": [6, 7, 8, 39], "str": [2, 4, 5, 6, 7, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 25, 30, 32, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 47], "string": [36, 37, 47], "structur": [32, 40], "sub": [24, 25, 45], "submodul": [16, 18, 22, 55], "subpackag": 55, "subsequ": [7, 8, 39], "summed_vari": [32, 38, 40], "support": [12, 24, 25, 41, 45], "surrog": 52, "t": [32, 40], "tag": [6, 39], "take": [24, 25, 33, 34, 45, 46], "taken": [32, 40], "tanh": [16, 18, 22, 42, 43, 44], "tanhtransformeddistribut": [22, 41, 44], "target": [10, 14, 15, 21, 23, 41, 42, 44], "target_param": [10, 14, 15, 23, 41, 42, 44], "td_error": [10, 14, 15, 21, 23, 41, 42, 44], "term": 49, "termin": [2, 4, 5, 38, 39], "than": [7, 39, 51], "thi": [0, 2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 16, 17, 18, 19, 21, 22, 23, 32, 38, 39, 40, 41, 42, 43, 44, 48, 49, 51, 52, 54], "three": [16, 18, 22, 42, 43, 44], "time": [20, 41], "timestep": [10, 11, 13, 14, 15, 17, 19, 21, 23, 40, 41, 42, 43, 44], "to_tupl": [40, 41], "top": [2, 38], "torch_lay": [18, 22, 43, 44], "total": [2, 4, 5, 7, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 41, 42, 43, 44], "tpu": [20, 41], "track_metr": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "track_trajectori": [10, 11, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "train": [2, 4, 5, 6, 7, 8, 10, 11, 14, 15, 17, 19, 21, 23, 38, 39, 40, 41, 42, 43, 44], "train_func": [7, 8, 39], "train_result": [6, 10, 11, 14, 15, 17, 19, 21, 23, 39, 41, 42, 43, 44], "train_stat": [10, 14, 15, 17, 19, 41, 42, 43], "trainfunc": [7, 8, 39], "training_result": [10, 11, 41], 
"trainresult": [6, 39], "trainstat": [15, 19, 23, 42, 43, 44], "trajectori": [10, 12, 14, 15, 17, 19, 20, 21, 23, 41, 42, 43, 44], "trajectorybufferst": [6, 39], "transform": [22, 44], "transit": [10, 14, 15, 17, 19, 20, 21, 23, 41, 42, 43, 44], "transitionsampl": [12, 41], "true": [10, 11, 14, 15, 16, 17, 18, 19, 21, 23, 32, 40, 41, 42, 43, 44], "truncat": [2, 4, 5, 38, 39], "tupl": [2, 3, 4, 5, 6, 10, 11, 14, 15, 17, 19, 21, 23, 24, 25, 33, 34, 36, 37, 38, 39, 41, 42, 43, 44, 45, 46, 47], "tuple1": [36, 37, 47], "tuple2": [36, 37, 47], "tuple_concat": [36, 37, 38, 47], "twice": [32, 40], "two": [7, 36, 37, 39, 47], "tx": [15, 19, 23, 42, 43, 44], "type": [2, 3, 4, 5, 6, 7, 8, 10, 11, 12, 14, 15, 17, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "u": [7, 8, 39], "under": [0, 48, 54], "uniform": [12, 41], "uniform_sampl": [12, 40, 41], "union": [17, 19, 21, 23, 41, 42, 43, 44, 45], "uniqu": [6, 39], "unus": [10, 14, 15, 17, 19, 21, 23, 41, 42, 43, 44], "updat": [10, 11, 14, 15, 17, 19, 21, 23, 32, 38, 40, 41, 42, 43, 44], "update_actor": [10, 21, 23, 40, 41, 44], "update_alpha": [10, 21, 23, 40, 41, 44], "update_crit": [10, 21, 23, 40, 41, 44], "update_hpo_config": [10, 11, 40, 41], "us": [2, 3, 4, 5, 7, 10, 11, 14, 15, 17, 19, 20, 21, 23, 24, 30, 32, 38, 39, 40, 41, 42, 43, 44, 45, 51, 52], "util": [32, 38, 40, 55], "valid": [32, 40], "validate_shap": [32, 40], "valu": [13, 15, 19, 23, 32, 36, 37, 40, 41, 42, 43, 44, 47], "valueerror": [2, 4, 5, 38, 39], "varianc": [32, 40], "variou": [24, 25, 45], "vault": [6, 39], "vault_uuid": [6, 39], "view": [13, 41], "wa": [2, 4, 5, 6, 32, 38, 39, 40], "we": [7, 8, 39, 51], "weigh": 52, "weight": [32, 40], "well": [6, 24, 25, 39, 45], "when": [16, 18, 22, 32, 40, 42, 43, 44, 51], "where": [6, 39, 51], "whether": [6, 7, 10, 11, 20, 39, 41], "which": [6, 16, 18, 22, 39, 42, 43, 44, 51], "while": [7, 8, 39], "wise": [36, 37, 47], "work": [16, 18, 22, 42, 43, 44, 
51], "world": [49, 52], "would": 51, "wrap": [7, 8, 16, 18, 22, 33, 34, 39, 42, 43, 44, 46, 51], "wrapper": [24, 30, 38, 40, 45], "write": [36, 37, 47, 49], "x": [16, 18, 22, 27, 42, 43, 44, 45], "xland": [24, 30, 31, 45], "xland_env": [38, 40], "xlandenv": [31, 40, 45], "yaml": [36, 37, 47], "ye": 51, "yet": [16, 18, 22, 42, 43, 44], "you": 51, "your": [49, 51]}, "titles": ["Advanced Usage", "API References", "arlbench", "arlbench.arlbench", "arlbench.autorl", "arlbench.autorl.autorl_env", "arlbench.autorl.checkpointing", "arlbench.autorl.objectives", "arlbench.autorl.state_features", "arlbench.core", "arlbench.core.algorithms", "arlbench.core.algorithms.algorithm", "arlbench.core.algorithms.buffers", "arlbench.core.algorithms.common", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.dqn.dqn", "arlbench.core.algorithms.dqn.models", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.ppo.models", "arlbench.core.algorithms.ppo.ppo", "arlbench.core.algorithms.prioritised_item_buffer", "arlbench.core.algorithms.sac", "arlbench.core.algorithms.sac.models", "arlbench.core.algorithms.sac.sac", "arlbench.core.environments", "arlbench.core.environments.autorl_env", "arlbench.core.environments.brax_env", "arlbench.core.environments.envpool_env", "arlbench.core.environments.gymnasium_env", "arlbench.core.environments.gymnax_env", "arlbench.core.environments.make_env", "arlbench.core.environments.xland_env", "arlbench.core.running_statistics", "arlbench.core.wrappers", "arlbench.core.wrappers.flatten_observation", "arlbench.core.wrappers.wrapper", "arlbench.utils", "arlbench.utils.common", "arlbench package", "arlbench.autorl package", "arlbench.core package", "arlbench.core.algorithms package", "arlbench.core.algorithms.dqn package", "arlbench.core.algorithms.ppo package", "arlbench.core.algorithms.sac package", "arlbench.core.environments package", "arlbench.core.wrappers package", "arlbench.utils package", "Basic Usage", "Helpful Commands", "&lt;no 
title&gt;", "Frequently Asked Questions", "Glossary", "Home", "Installation", "arlbench"], "titleterms": {"advanc": 0, "algorithm": [10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 41, 42, 43, 44], "api": 1, "arlbench": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 55], "ask": 51, "autorl": [4, 5, 6, 7, 8, 39], "autorl_env": [5, 25, 39, 45], "basic": 48, "brax_env": [26, 45], "buffer": [12, 41], "checkpoint": [6, 39], "command": 49, "common": [13, 37, 41, 47], "content": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "core": [9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 40, 41, 42, 43, 44, 45, 46], "dqn": [14, 15, 16, 42], "environ": [24, 25, 26, 27, 28, 29, 30, 31, 45], "envpool_env": [27, 45], "flatten_observ": [34, 46], "frequent": 51, "glossari": 52, "gymnasium_env": [28, 45], "gymnax_env": [29, 45], "help": 49, "home": 53, "instal": 54, "make_env": [30, 45], "model": [16, 18, 22, 42, 43, 44], "modul": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "object": [7, 39], "packag": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "ppo": [17, 18, 19, 43], "prioritised_item_buff": [20, 41], "question": 51, "refer": 1, "running_statist": [32, 40], "sac": [21, 22, 23, 44], "state_featur": [8, 39], "submodul": [38, 39, 40, 41, 42, 43, 44, 45, 46, 47], "subpackag": [38, 40, 41], "usag": [0, 48], "util": [36, 37, 47], "wrapper": [33, 34, 35, 46], "xland_env": [31, 45]}})
\ No newline at end of file