diff --git a/main/.doctrees/advanced_usage/algorithm_states.doctree b/main/.doctrees/advanced_usage/algorithm_states.doctree
index 22ae7761e..e98858f2f 100644
Binary files a/main/.doctrees/advanced_usage/algorithm_states.doctree and b/main/.doctrees/advanced_usage/algorithm_states.doctree differ
diff --git a/main/.doctrees/advanced_usage/autorl_paradigms.doctree b/main/.doctrees/advanced_usage/autorl_paradigms.doctree
index 3999d1946..f7cde32eb 100644
Binary files a/main/.doctrees/advanced_usage/autorl_paradigms.doctree and b/main/.doctrees/advanced_usage/autorl_paradigms.doctree differ
diff --git a/main/.doctrees/advanced_usage/dynamic_configuration.doctree b/main/.doctrees/advanced_usage/dynamic_configuration.doctree
index 22524dea6..76f6bb701 100644
Binary files a/main/.doctrees/advanced_usage/dynamic_configuration.doctree and b/main/.doctrees/advanced_usage/dynamic_configuration.doctree differ
diff --git a/main/.doctrees/basic_usage/env_subsets.doctree b/main/.doctrees/basic_usage/env_subsets.doctree
index aaae1059d..371cb0e5e 100644
Binary files a/main/.doctrees/basic_usage/env_subsets.doctree and b/main/.doctrees/basic_usage/env_subsets.doctree differ
diff --git a/main/.doctrees/basic_usage/index.doctree b/main/.doctrees/basic_usage/index.doctree
index ac61c0f81..4a0ba2302 100644
Binary files a/main/.doctrees/basic_usage/index.doctree and b/main/.doctrees/basic_usage/index.doctree differ
diff --git a/main/.doctrees/basic_usage/objectives.doctree b/main/.doctrees/basic_usage/objectives.doctree
index e67ce209c..4564dccdd 100644
Binary files a/main/.doctrees/basic_usage/objectives.doctree and b/main/.doctrees/basic_usage/objectives.doctree differ
diff --git a/main/.doctrees/basic_usage/options.doctree b/main/.doctrees/basic_usage/options.doctree
index 780c38661..fa4650ae4 100644
Binary files a/main/.doctrees/basic_usage/options.doctree and b/main/.doctrees/basic_usage/options.doctree differ
diff --git a/main/.doctrees/basic_usage/seeding.doctree b/main/.doctrees/basic_usage/seeding.doctree
index 6d4ad7d77..e66e6605b 100644
Binary files a/main/.doctrees/basic_usage/seeding.doctree and b/main/.doctrees/basic_usage/seeding.doctree differ
diff --git a/main/.doctrees/environment.pickle b/main/.doctrees/environment.pickle
index 3f8b80e02..a80b3ce54 100644
Binary files a/main/.doctrees/environment.pickle and b/main/.doctrees/environment.pickle differ
diff --git a/main/_sources/advanced_usage/algorithm_states.rst.txt b/main/_sources/advanced_usage/algorithm_states.rst.txt
index b0f2a40f9..92591589d 100644
--- a/main/_sources/advanced_usage/algorithm_states.rst.txt
+++ b/main/_sources/advanced_usage/algorithm_states.rst.txt
@@ -1,2 +1,4 @@
 Using the ARLBench States
-==========================
\ No newline at end of file
+==========================
+
+In addition to providing different objectives, ARLBench also provides insights into the target algorithms' internal states.
\ No newline at end of file
diff --git a/main/_sources/advanced_usage/autorl_paradigms.rst.txt b/main/_sources/advanced_usage/autorl_paradigms.rst.txt
index 1bc5a5827..9c8a29ef1 100644
--- a/main/_sources/advanced_usage/autorl_paradigms.rst.txt
+++ b/main/_sources/advanced_usage/autorl_paradigms.rst.txt
@@ -1,2 +1,4 @@
 ARLBench and Different AutoRL Paradigms
-=======================================
\ No newline at end of file
+=======================================
+
+TODO: relationship to other AutoRL paradigms
\ No newline at end of file
diff --git a/main/_sources/advanced_usage/dynamic_configuration.rst.txt b/main/_sources/advanced_usage/dynamic_configuration.rst.txt
index ae8b3b26d..5d6cde095 100644
--- a/main/_sources/advanced_usage/dynamic_configuration.rst.txt
+++ b/main/_sources/advanced_usage/dynamic_configuration.rst.txt
@@ -1,2 +1,4 @@
 Dynamic Configuration in ARLBench
-==================================
\ No newline at end of file
+==================================
+
+How to dynamic?
\ No newline at end of file
diff --git a/main/_sources/basic_usage/env_subsets.rst.txt b/main/_sources/basic_usage/env_subsets.rst.txt
index 7734e9d75..69aeafa24 100644
--- a/main/_sources/basic_usage/env_subsets.rst.txt
+++ b/main/_sources/basic_usage/env_subsets.rst.txt
@@ -1,2 +1,12 @@
 The ARLBench Subsets
-====================
\ No newline at end of file
+====================
+
+We analyzed the hyperparameter landscapes of PPO, DQN and SAC on 20 environments to select a subset which allows for efficient benchmarking of AutoRL algorithms. These are the resulting subsets:
+
+.. image:: path/subsets.png
+  :width: 800
+  :alt: Overview of the selected ARLBench environment subsets
+
+We strongly recommend you focus your benchmarking on these exact environments to ensure you cover the total landscape of RL behaviors well.
+The data generated for selecting these environments is available on `HuggingFace <https://huggingface.co/datasets/autorl-org/arlbench>`_ for you to use in your experiments.
+For more information on how the subset selection was done, please refer to our paper.
\ No newline at end of file
diff --git a/main/_sources/basic_usage/index.rst.txt b/main/_sources/basic_usage/index.rst.txt
index 621ec6ad4..c1a1cc4bf 100644
--- a/main/_sources/basic_usage/index.rst.txt
+++ b/main/_sources/basic_usage/index.rst.txt
@@ -9,6 +9,7 @@ Benchmarking AutoRL Methods
    seeding
 
 
+
 ARLBench provides an basis for benchmarking different AutoRL methods. This section of the documentation focuses on the prominent aspect of black-box hyperparameter optimization, since it's the simplest usecase of ARLBench.
 We discuss the structure of ARLBenchmark, the currently supported objectives, the environment subsets and search spaces we provide and the seeding of the experiments in their own subpages. 
 The most important question, however, is how to actually use ARLBench in your experiments. This is the workflow we propose:
diff --git a/main/_sources/basic_usage/objectives.rst.txt b/main/_sources/basic_usage/objectives.rst.txt
index 59f2be739..1a59039a6 100644
--- a/main/_sources/basic_usage/objectives.rst.txt
+++ b/main/_sources/basic_usage/objectives.rst.txt
@@ -1,2 +1,16 @@
 Objectives in ARLBench
-======================
\ No newline at end of file
+======================
+
+ARLBench allows you to configure the objectives you'd like to use for your AutoRL methods.
+These are selected as a list of keywords in the configuration of the AutoRL Environment, e.g. like this:
+
+.. code-block:: bash
+
+    python arlbench.py autorl.objectives=["reward_mean"]
+
+The following objectives are available at the moment:
+
+- reward_mean: the mean evaluation reward across a number of evaluation episodes
+- reward_std: the standard deviation of the evaluation rewards across a number of evaluation episodes
+- runtime: the runtime of the training process
+- emissions: the CO2 emissions of the training process
\ No newline at end of file
diff --git a/main/_sources/basic_usage/options.rst.txt b/main/_sources/basic_usage/options.rst.txt
index bf2b2f3f1..3c499bc81 100644
--- a/main/_sources/basic_usage/options.rst.txt
+++ b/main/_sources/basic_usage/options.rst.txt
@@ -1,2 +1,28 @@
 ARLBench Options
-================
\ No newline at end of file
+================
+
+A given training run in ARLBench can be configured on two levels: the lower one is the configuration that happens via the AutoRL tool we benchmark while the upper level decides the setting we test the AutoRL tool in.
+The high level configuration takes place via the 'autorl' keys in the configuration file. These are the available options:
+
+- **seed**: The seed for the random number generator 
+- **env_framework**: Environment framework to use. Currently supported: gymnax, envpool, brax, xland
+- **env_name**: The name of the environment to use
+- **env_kwargs**: Additional keyword arguments for the environment
+- **eval_env_kwargs**: Additional keyword arguments for the evaluation environment
+- **n_envs**: Number of environments to use in parallel
+- **algorithm**: The algorithm to use. Currently supported: dqn, ppo, sac
+- **cnn_policy**: Whether to use a CNN policy
+- **deterministic_eval**: Whether to use deterministic evaluation. This disables exploration behaviors in evaluation.
+- **nas_config**: Configuration for architecture
+- **checkpoint**: A list of elements the checkpoint should contain 
+- **checkpoint_name**: The name of the checkpoint
+- **checkpoint_dir**: The directory to save the checkpoint in
+- **objectives**: The objectives to optimize for. Currently supported: reward_mean, reward_std, runtime, emissions
+- **optimize_objectives**: Whether to maximize or minimize the objectives
+- **state_features**: The features of the RL algorithm's state to return
+- **n_steps**: The number of steps in the configuration schedule. Using 1 will result in a static configuration
+- **n_total_timesteps**: The total number of timesteps to train in each schedule interval
+- **n_eval_steps**: The number of steps to evaluate the agent for
+- **n_eval_episodes**: The number of episodes to evaluate the agent for
+
+The low level configuration options can be found in the 'hp_config' key set, containing the configurable hyperparameters and architecture of each algorithm. Please refer to the search space overview for more information.
diff --git a/main/_sources/basic_usage/seeding.rst.txt b/main/_sources/basic_usage/seeding.rst.txt
index 89fa99ad1..983eafe0c 100644
--- a/main/_sources/basic_usage/seeding.rst.txt
+++ b/main/_sources/basic_usage/seeding.rst.txt
@@ -1,2 +1,4 @@
 Considerations for Seeding
-============================
\ No newline at end of file
+============================
+
+Seeding is important both on the level of RL algorithms and on the AutoRL level.
\ No newline at end of file
diff --git a/main/advanced_usage/algorithm_states.html b/main/advanced_usage/algorithm_states.html
index b90d8dc27..bce8f7d21 100644
--- a/main/advanced_usage/algorithm_states.html
+++ b/main/advanced_usage/algorithm_states.html
@@ -301,6 +301,7 @@
                 
   <section id="using-the-arlbench-states">
 <h1>Using the ARLBench States<a class="headerlink" href="#using-the-arlbench-states" title="Link to this heading">¶</a></h1>
+<p>In addition to providing different objectives, ARLBench also provides insights into the target algorithms’ internal states.</p>
 </section>
 
 
diff --git a/main/advanced_usage/autorl_paradigms.html b/main/advanced_usage/autorl_paradigms.html
index b03884f9d..6d8af0627 100644
--- a/main/advanced_usage/autorl_paradigms.html
+++ b/main/advanced_usage/autorl_paradigms.html
@@ -301,6 +301,7 @@
                 
   <section id="arlbench-and-different-autorl-paradigms">
 <h1>ARLBench and Different AutoRL Paradigms<a class="headerlink" href="#arlbench-and-different-autorl-paradigms" title="Link to this heading">¶</a></h1>
+<p>TODO: relationship to other AutoRL paradigms</p>
 </section>
 
 
diff --git a/main/advanced_usage/dynamic_configuration.html b/main/advanced_usage/dynamic_configuration.html
index 923f13322..c2924873d 100644
--- a/main/advanced_usage/dynamic_configuration.html
+++ b/main/advanced_usage/dynamic_configuration.html
@@ -301,6 +301,7 @@
                 
   <section id="dynamic-configuration-in-arlbench">
 <h1>Dynamic Configuration in ARLBench<a class="headerlink" href="#dynamic-configuration-in-arlbench" title="Link to this heading">¶</a></h1>
+<p>How to dynamic?</p>
 </section>
 
 
diff --git a/main/basic_usage/env_subsets.html b/main/basic_usage/env_subsets.html
index b4837fe74..fe318a915 100644
--- a/main/basic_usage/env_subsets.html
+++ b/main/basic_usage/env_subsets.html
@@ -301,6 +301,12 @@
                 
   <section id="the-arlbench-subsets">
 <h1>The ARLBench Subsets<a class="headerlink" href="#the-arlbench-subsets" title="Link to this heading">¶</a></h1>
+<p>We analyzed the hyperparameter landscapes of PPO, DQN and SAC on 20 environments to select a subset which allows for efficient benchmarking of AutoRL algorithms. These are the resulting subsets:</p>
+<a class="reference internal image-reference" href="basic_usage/path/subsets.png"><img alt="Alternative text" src="basic_usage/path/subsets.png" style="width: 800px;" />
+</a>
+<p>We strongly recommend you focus your benchmarking on these exact environments to ensure you cover the total landscape of RL behaviors well.
+The data generated for selecting these environments is available on <a class="reference external" href="https://huggingface.co/datasets/autorl-org/arlbench">HuggingFace</a> for you to use in your experiments.
+For more information on how the subset selection was done, please refer to our paper.</p>
 </section>
 
 
diff --git a/main/basic_usage/objectives.html b/main/basic_usage/objectives.html
index 40b80efa4..73c36b921 100644
--- a/main/basic_usage/objectives.html
+++ b/main/basic_usage/objectives.html
@@ -301,6 +301,16 @@
                 
   <section id="objectives-in-arlbench">
 <h1>Objectives in ARLBench<a class="headerlink" href="#objectives-in-arlbench" title="Link to this heading">¶</a></h1>
+<p>ARLBench allows you to configure the objectives you’d like to use for your AutoRL methods.
+These are selected as a list of keywords in the configuration of the AutoRL Environment, e.g. like this:</p>
+<div class="highlight-bash notranslate"><div class="highlight"><pre><span></span>python<span class="w"> </span>arlbench.py<span class="w"> </span>autorl.objectives<span class="o">=[</span><span class="s2">&quot;reward_mean&quot;</span><span class="o">]</span>
+</pre></div>
+</div>
+<p>The following objectives are available at the moment:
+- reward_mean: the mean evaluation reward across a number of evaluation episodes
+- reward_std: the standard deviation of the evaluation rewards across a number of evaluation episodes
+- runtime: the runtime of the training process
+- emissions: the CO2 emissions of the training process</p>
 </section>
 
 
diff --git a/main/basic_usage/options.html b/main/basic_usage/options.html
index ed078a4b0..1c76f9e02 100644
--- a/main/basic_usage/options.html
+++ b/main/basic_usage/options.html
@@ -301,6 +301,31 @@
                 
   <section id="arlbench-options">
 <h1>ARLBench Options<a class="headerlink" href="#arlbench-options" title="Link to this heading">¶</a></h1>
+<p>A given training run in ARLBench can be configured on two levels: the lower one is the configuration that happens via the AutoRL tool we benchmark while the upper level decides the setting we test the AutoRL tool in.
+The high level configuration takes place via the ‘autorl’ keys in the configuration file. These are the available options:</p>
+<ul class="simple">
+<li><p><strong>seed</strong>: The seed for the random number generator</p></li>
+<li><p><strong>env_framework</strong>: Environment framework to use. Currently supported: gymnax, envpool, brax, xland</p></li>
+<li><p><strong>env_name</strong>: The name of the environment to use</p></li>
+<li><p><strong>env_kwargs</strong>: Additional keyword arguments for the environment</p></li>
+<li><p><strong>eval_env_kwargs</strong>: Additional keyword arguments for the evaluation environment</p></li>
+<li><p><strong>n_envs</strong>: Number of environments to use in parallel</p></li>
+<li><p><strong>algorithm</strong>: The algorithm to use. Currently supported: dqn, ppo, sac</p></li>
+<li><p><strong>cnn_policy</strong>: Whether to use a CNN policy</p></li>
+<li><p><strong>deterministic_eval</strong>: Whether to use deterministic evaluation. This disables exploration behaviors in evaluation.</p></li>
+<li><p><strong>nas_config</strong>: Configuration for architecture</p></li>
+<li><p><strong>checkpoint</strong>: A list of elements the checkpoint should contain</p></li>
+<li><p><strong>checkpoint_name</strong>: The name of the checkpoint</p></li>
+<li><p><strong>checkpoint_dir</strong>: The directory to save the checkpoint in</p></li>
+<li><p><strong>objectives</strong>: The objectives to optimize for. Currently supported: reward_mean, reward_std, runtime, emissions</p></li>
+<li><p><strong>optimize_objectives</strong>: Whether to maximize or minimize the objectives</p></li>
+<li><p><strong>state_features</strong>: The features of the RL algorithm’s state to return</p></li>
+<li><p><strong>n_steps</strong>: The number of steps in the configuration schedule. Using 1 will result in a static configuration</p></li>
+<li><p><strong>n_total_timesteps</strong>: The total number of timesteps to train in each schedule interval</p></li>
+<li><p><strong>n_eval_steps</strong>: The number of steps to evaluate the agent for</p></li>
+<li><p><strong>n_eval_episodes</strong>: The number of episodes to evaluate the agent for</p></li>
+</ul>
+<p>The low level configuration options can be found in the ‘hp_config’ key set, containing the configurable hyperparameters and architecture of each algorithm. Please refer to the search space overview for more information.</p>
 </section>
 
 
diff --git a/main/basic_usage/seeding.html b/main/basic_usage/seeding.html
index 70408f162..0f90d0d91 100644
--- a/main/basic_usage/seeding.html
+++ b/main/basic_usage/seeding.html
@@ -301,6 +301,7 @@
                 
   <section id="considerations-for-seeding">
 <h1>Considerations for Seeding<a class="headerlink" href="#considerations-for-seeding" title="Link to this heading">¶</a></h1>
+<p>Seeding is important both on the level of RL algorithms and on the AutoRL level.</p>
 </section>
 
 
diff --git a/main/searchindex.js b/main/searchindex.js
index 8bd516bab..99efa2d94 100644
--- a/main/searchindex.js
+++ b/main/searchindex.js
@@ -1 +1 @@
-Search.setIndex({"alltitles": {"API References": [[4, "api-references"]], "ARLBench Options": [[54, "arlbench-options"]], "ARLBench and Different AutoRL Paradigms": [[1, "arlbench-and-different-autorl-paradigms"]], "Advanced Configuration Options": [[3, "advanced-configuration-options"]], "Benchmarking AutoRL Methods": [[52, "benchmarking-autorl-methods"]], "Considerations for Seeding": [[55, "considerations-for-seeding"]], "Dynamic Configuration in ARLBench": [[2, "dynamic-configuration-in-arlbench"]], "Frequently Asked Questions": [[57, "frequently-asked-questions"]], "Glossary": [[58, "glossary"]], "Home": [[59, "home"]], "Installation": [[60, "installation"]], "Module contents": [[41, "module-arlbench"], [42, "module-arlbench.autorl"], [43, "module-arlbench.core"], [44, "module-arlbench.core.algorithms"], [45, "module-arlbench.core.algorithms.dqn"], [46, "module-arlbench.core.algorithms.ppo"], [47, "module-arlbench.core.algorithms.sac"], [48, "module-arlbench.core.environments"], [49, "module-arlbench.core.wrappers"], [50, "module-arlbench.utils"]], "Objectives in ARLBench": [[53, "objectives-in-arlbench"]], "Submodules": [[41, "submodules"], [42, "submodules"], [43, "submodules"], [44, "submodules"], [45, "submodules"], [46, "submodules"], [47, "submodules"], [48, "submodules"], [49, "submodules"], [50, "submodules"]], "Subpackages": [[41, "subpackages"], [43, "subpackages"], [44, "subpackages"]], "The ARLBench Subsets": [[51, "the-arlbench-subsets"]], "Using the ARLBench States": [[0, "using-the-arlbench-states"]], "arlbench": [[5, "module-arlbench"], [61, "arlbench"]], "arlbench package": [[41, "arlbench-package"]], "arlbench.arlbench": [[6, "module-arlbench.arlbench"]], "arlbench.arlbench module": [[41, "module-arlbench.arlbench"]], "arlbench.autorl": [[7, "module-arlbench.autorl"]], "arlbench.autorl package": [[42, "arlbench-autorl-package"]], "arlbench.autorl.autorl_env": [[8, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.autorl_env module": 
[[42, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.checkpointing": [[9, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.checkpointing module": [[42, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.objectives": [[10, "module-arlbench.autorl.objectives"]], "arlbench.autorl.objectives module": [[42, "module-arlbench.autorl.objectives"]], "arlbench.autorl.state_features": [[11, "module-arlbench.autorl.state_features"]], "arlbench.autorl.state_features module": [[42, "module-arlbench.autorl.state_features"]], "arlbench.core": [[12, "module-arlbench.core"]], "arlbench.core package": [[43, "arlbench-core-package"]], "arlbench.core.algorithms": [[13, "module-arlbench.core.algorithms"]], "arlbench.core.algorithms package": [[44, "arlbench-core-algorithms-package"]], "arlbench.core.algorithms.algorithm": [[14, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.algorithm module": [[44, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.buffers": [[15, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.buffers module": [[44, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.common": [[16, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.common module": [[44, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.dqn": [[17, "module-arlbench.core.algorithms.dqn"]], "arlbench.core.algorithms.dqn package": [[45, "arlbench-core-algorithms-dqn-package"]], "arlbench.core.algorithms.dqn.dqn": [[18, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.dqn module": [[45, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.models": [[19, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.dqn.models module": [[45, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.ppo": [[20, "module-arlbench.core.algorithms.ppo"]], "arlbench.core.algorithms.ppo 
package": [[46, "arlbench-core-algorithms-ppo-package"]], "arlbench.core.algorithms.ppo.models": [[21, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.models module": [[46, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.ppo": [[22, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.ppo.ppo module": [[46, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.prioritised_item_buffer": [[23, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.prioritised_item_buffer module": [[44, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[24, "module-arlbench.core.algorithms.sac"]], "arlbench.core.algorithms.sac package": [[47, "arlbench-core-algorithms-sac-package"]], "arlbench.core.algorithms.sac.models": [[25, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.models module": [[47, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.sac": [[26, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.algorithms.sac.sac module": [[47, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.environments": [[27, "module-arlbench.core.environments"]], "arlbench.core.environments package": [[48, "arlbench-core-environments-package"]], "arlbench.core.environments.autorl_env": [[28, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.autorl_env module": [[48, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.brax_env": [[29, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.brax_env module": [[48, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.envpool_env": [[30, "module-arlbench.core.environments.envpool_env"]], "arlbench.core.environments.envpool_env module": [[48, "module-arlbench.core.environments.envpool_env"]], 
"arlbench.core.environments.gymnasium_env": [[31, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnasium_env module": [[48, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnax_env": [[32, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.gymnax_env module": [[48, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.make_env": [[33, "arlbench-core-environments-make-env"]], "arlbench.core.environments.make_env module": [[48, "module-arlbench.core.environments.make_env"]], "arlbench.core.environments.xland_env": [[34, "module-arlbench.core.environments.xland_env"]], "arlbench.core.environments.xland_env module": [[48, "module-arlbench.core.environments.xland_env"]], "arlbench.core.running_statistics": [[35, "module-arlbench.core.running_statistics"]], "arlbench.core.running_statistics module": [[43, "module-arlbench.core.running_statistics"]], "arlbench.core.wrappers": [[36, "module-arlbench.core.wrappers"]], "arlbench.core.wrappers package": [[49, "arlbench-core-wrappers-package"]], "arlbench.core.wrappers.flatten_observation": [[37, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.flatten_observation module": [[49, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.wrapper": [[38, "module-arlbench.core.wrappers.wrapper"]], "arlbench.core.wrappers.wrapper module": [[49, "module-arlbench.core.wrappers.wrapper"]], "arlbench.utils": [[39, "module-arlbench.utils"]], "arlbench.utils package": [[50, "arlbench-utils-package"]], "arlbench.utils.common": [[40, "module-arlbench.utils.common"]], "arlbench.utils.common module": [[50, "module-arlbench.utils.common"]]}, "docnames": ["advanced_usage/algorithm_states", "advanced_usage/autorl_paradigms", "advanced_usage/dynamic_configuration", "advanced_usage/index", "api", "api/arlbench", "api/arlbench.arlbench", "api/arlbench.autorl", 
"api/arlbench.autorl.autorl_env", "api/arlbench.autorl.checkpointing", "api/arlbench.autorl.objectives", "api/arlbench.autorl.state_features", "api/arlbench.core", "api/arlbench.core.algorithms", "api/arlbench.core.algorithms.algorithm", "api/arlbench.core.algorithms.buffers", "api/arlbench.core.algorithms.common", "api/arlbench.core.algorithms.dqn", "api/arlbench.core.algorithms.dqn.dqn", "api/arlbench.core.algorithms.dqn.models", "api/arlbench.core.algorithms.ppo", "api/arlbench.core.algorithms.ppo.models", "api/arlbench.core.algorithms.ppo.ppo", "api/arlbench.core.algorithms.prioritised_item_buffer", "api/arlbench.core.algorithms.sac", "api/arlbench.core.algorithms.sac.models", "api/arlbench.core.algorithms.sac.sac", "api/arlbench.core.environments", "api/arlbench.core.environments.autorl_env", "api/arlbench.core.environments.brax_env", "api/arlbench.core.environments.envpool_env", "api/arlbench.core.environments.gymnasium_env", "api/arlbench.core.environments.gymnax_env", "api/arlbench.core.environments.make_env", "api/arlbench.core.environments.xland_env", "api/arlbench.core.running_statistics", "api/arlbench.core.wrappers", "api/arlbench.core.wrappers.flatten_observation", "api/arlbench.core.wrappers.wrapper", "api/arlbench.utils", "api/arlbench.utils.common", "arlbench", "arlbench.autorl", "arlbench.core", "arlbench.core.algorithms", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.sac", "arlbench.core.environments", "arlbench.core.wrappers", "arlbench.utils", "basic_usage/env_subsets", "basic_usage/index", "basic_usage/objectives", "basic_usage/options", "basic_usage/seeding", "contributing", "faq", "glossary", "index", "installation", "modules"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 
2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["advanced_usage/algorithm_states.rst", "advanced_usage/autorl_paradigms.rst", "advanced_usage/dynamic_configuration.rst", "advanced_usage/index.rst", "api.rst", "api/arlbench.rst", "api/arlbench.arlbench.rst", "api/arlbench.autorl.rst", "api/arlbench.autorl.autorl_env.rst", "api/arlbench.autorl.checkpointing.rst", "api/arlbench.autorl.objectives.rst", "api/arlbench.autorl.state_features.rst", "api/arlbench.core.rst", "api/arlbench.core.algorithms.rst", "api/arlbench.core.algorithms.algorithm.rst", "api/arlbench.core.algorithms.buffers.rst", "api/arlbench.core.algorithms.common.rst", "api/arlbench.core.algorithms.dqn.rst", "api/arlbench.core.algorithms.dqn.dqn.rst", "api/arlbench.core.algorithms.dqn.models.rst", "api/arlbench.core.algorithms.ppo.rst", "api/arlbench.core.algorithms.ppo.models.rst", "api/arlbench.core.algorithms.ppo.ppo.rst", "api/arlbench.core.algorithms.prioritised_item_buffer.rst", "api/arlbench.core.algorithms.sac.rst", "api/arlbench.core.algorithms.sac.models.rst", "api/arlbench.core.algorithms.sac.sac.rst", "api/arlbench.core.environments.rst", "api/arlbench.core.environments.autorl_env.rst", "api/arlbench.core.environments.brax_env.rst", "api/arlbench.core.environments.envpool_env.rst", "api/arlbench.core.environments.gymnasium_env.rst", "api/arlbench.core.environments.gymnax_env.rst", "api/arlbench.core.environments.make_env.rst", "api/arlbench.core.environments.xland_env.rst", "api/arlbench.core.running_statistics.rst", "api/arlbench.core.wrappers.rst", "api/arlbench.core.wrappers.flatten_observation.rst", "api/arlbench.core.wrappers.wrapper.rst", "api/arlbench.utils.rst", "api/arlbench.utils.common.rst", "arlbench.rst", "arlbench.autorl.rst", "arlbench.core.rst", "arlbench.core.algorithms.rst", "arlbench.core.algorithms.dqn.rst", "arlbench.core.algorithms.ppo.rst", "arlbench.core.algorithms.sac.rst", "arlbench.core.environments.rst", "arlbench.core.wrappers.rst", 
"arlbench.utils.rst", "basic_usage/env_subsets.rst", "basic_usage/index.rst", "basic_usage/objectives.rst", "basic_usage/options.rst", "basic_usage/seeding.rst", "contributing.rst", "faq.rst", "glossary.rst", "index.rst", "installation.rst", "modules.rst"], "indexentries": {"__call__() (arlbench.autorl.objectives.emissions static method)": [[10, "arlbench.autorl.objectives.Emissions.__call__", false], [42, "arlbench.autorl.objectives.Emissions.__call__", false]], "__call__() (arlbench.autorl.objectives.objective static method)": [[10, "arlbench.autorl.objectives.Objective.__call__", false], [42, "arlbench.autorl.objectives.Objective.__call__", false]], "__call__() (arlbench.autorl.objectives.rewardmean static method)": [[10, "arlbench.autorl.objectives.RewardMean.__call__", false], [42, "arlbench.autorl.objectives.RewardMean.__call__", false]], "__call__() (arlbench.autorl.objectives.rewardstd static method)": [[10, "arlbench.autorl.objectives.RewardStd.__call__", false], [42, "arlbench.autorl.objectives.RewardStd.__call__", false]], "__call__() (arlbench.autorl.objectives.runtime static method)": [[10, "arlbench.autorl.objectives.Runtime.__call__", false], [42, "arlbench.autorl.objectives.Runtime.__call__", false]], "__call__() (arlbench.autorl.state_features.gradinfo static method)": [[11, "arlbench.autorl.state_features.GradInfo.__call__", false], [42, "arlbench.autorl.state_features.GradInfo.__call__", false]], "__call__() (arlbench.autorl.state_features.statefeature static method)": [[11, "arlbench.autorl.state_features.StateFeature.__call__", false], [42, "arlbench.autorl.state_features.StateFeature.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.cnnq method)": [[19, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false], [45, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.mlpq method)": [[19, "arlbench.core.algorithms.dqn.models.MLPQ.__call__", false], [45, 
"arlbench.core.algorithms.dqn.models.MLPQ.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false], [46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false], [46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.alphacoef method)": [[25, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false], [47, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacvectorcritic method)": [[25, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false]], "__lt__() (arlbench.autorl.objectives.objective method)": [[10, "arlbench.autorl.objectives.Objective.__lt__", false], [42, 
"arlbench.autorl.objectives.Objective.__lt__", false]], "__new__() (arlbench.autorl.objectives.objective static method)": [[10, "arlbench.autorl.objectives.Objective.__new__", false], [42, "arlbench.autorl.objectives.Objective.__new__", false]], "__new__() (arlbench.autorl.state_features.statefeature static method)": [[11, "arlbench.autorl.state_features.StateFeature.__new__", false], [42, "arlbench.autorl.state_features.StateFeature.__new__", false]], "action (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.action", false]], "action (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.action", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.action", false]], "action (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.action", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.action", false]], "action (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.action", false], [47, "arlbench.core.algorithms.sac.sac.Transition.action", false]], "action_dim (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.action_dim", false]], "action_dim (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnncritic 
attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.action_dim", false]], "action_space (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false]], "action_space (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.action_space", false], [42, "arlbench.autorl.AutoRLEnv.action_space", false]], "action_space (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.action_space", false], [41, "arlbench.AutoRLEnv.action_space", false]], "action_space (arlbench.core.environments.brax_env.braxenv property)": [[29, "arlbench.core.environments.brax_env.BraxEnv.action_space", false], [48, "arlbench.core.environments.brax_env.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.braxenv property)": [[27, "arlbench.core.environments.BraxEnv.action_space", false], [48, "arlbench.core.environments.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[30, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false], [48, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.envpoolenv property)": [[27, "arlbench.core.environments.EnvpoolEnv.action_space", false], [48, "arlbench.core.environments.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[31, 
"arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false], [48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasiumenv property)": [[27, "arlbench.core.environments.GymnasiumEnv.action_space", false], [48, "arlbench.core.environments.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[32, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false], [48, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.gymnaxenv property)": [[27, "arlbench.core.environments.GymnaxEnv.action_space", false], [48, "arlbench.core.environments.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.xland_env.xlandenv property)": [[34, "arlbench.core.environments.xland_env.XLandEnv.action_space", false], [48, "arlbench.core.environments.xland_env.XLandEnv.action_space", false]], "action_space() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.action_space", false], [48, "arlbench.core.environments.autorl_env.Environment.action_space", false]], "action_space() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.action_space", false], [48, "arlbench.core.environments.Environment.action_space", false]], "action_type (arlbench.core.algorithms.algorithm property)": [[13, "arlbench.core.algorithms.Algorithm.action_type", false], [44, "arlbench.core.algorithms.Algorithm.action_type", false]], "action_type (arlbench.core.algorithms.algorithm.algorithm property)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false]], "activation (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.activation", 
false]], "activation (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.activation", false]], "activation (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.activation", false]], "activation (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.activation", false]], "actor_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false]], "actor_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false], [47, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false]], "actor_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false]], "actor_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false], 
[47, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false]], "actor_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false]], "actor_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false]], "advantages (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false]], "advantages (arlbench.core.algorithms.ppo.ppometrics attribute)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics.advantages", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics.advantages", false]], "algorithm (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.Algorithm", false], [44, "arlbench.core.algorithms.Algorithm", false]], "algorithm (class in arlbench.core.algorithms.algorithm)": [[14, "arlbench.core.algorithms.algorithm.Algorithm", false], [44, "arlbench.core.algorithms.algorithm.Algorithm", false]], "algorithms (arlbench.autorl.autorl_env.autorlenv attribute)": [[42, "arlbench.autorl.autorl_env.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorl.autorlenv attribute)": [[42, "arlbench.autorl.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorlenv attribute)": [[41, "arlbench.AutoRLEnv.ALGORITHMS", false]], "alpha_init (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.alpha_init", false]], "alpha_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false]], 
"alpha_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false], [47, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false]], "alpha_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false]], "alpha_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false]], "alphacoef (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.AlphaCoef", false], [47, "arlbench.core.algorithms.sac.models.AlphaCoef", false]], "arlbench": [[5, "module-arlbench", false], [41, "module-arlbench", false]], "arlbench.arlbench": [[6, "module-arlbench.arlbench", false], [41, "module-arlbench.arlbench", false]], "arlbench.autorl": [[7, "module-arlbench.autorl", false], [42, "module-arlbench.autorl", false]], "arlbench.autorl.autorl_env": [[8, "module-arlbench.autorl.autorl_env", false], [42, "module-arlbench.autorl.autorl_env", false]], "arlbench.autorl.checkpointing": [[9, "module-arlbench.autorl.checkpointing", false], [42, "module-arlbench.autorl.checkpointing", false]], "arlbench.autorl.objectives": [[10, "module-arlbench.autorl.objectives", false], [42, "module-arlbench.autorl.objectives", false]], "arlbench.autorl.state_features": [[11, "module-arlbench.autorl.state_features", false], [42, "module-arlbench.autorl.state_features", false]], "arlbench.core": [[12, "module-arlbench.core", false], [43, "module-arlbench.core", false]], "arlbench.core.algorithms": [[13, "module-arlbench.core.algorithms", false], [44, "module-arlbench.core.algorithms", false]], "arlbench.core.algorithms.algorithm": [[14, 
"module-arlbench.core.algorithms.algorithm", false], [44, "module-arlbench.core.algorithms.algorithm", false]], "arlbench.core.algorithms.buffers": [[15, "module-arlbench.core.algorithms.buffers", false], [44, "module-arlbench.core.algorithms.buffers", false]], "arlbench.core.algorithms.common": [[16, "module-arlbench.core.algorithms.common", false], [44, "module-arlbench.core.algorithms.common", false]], "arlbench.core.algorithms.dqn": [[17, "module-arlbench.core.algorithms.dqn", false], [45, "module-arlbench.core.algorithms.dqn", false]], "arlbench.core.algorithms.dqn.dqn": [[18, "module-arlbench.core.algorithms.dqn.dqn", false], [45, "module-arlbench.core.algorithms.dqn.dqn", false]], "arlbench.core.algorithms.dqn.models": [[19, "module-arlbench.core.algorithms.dqn.models", false], [45, "module-arlbench.core.algorithms.dqn.models", false]], "arlbench.core.algorithms.ppo": [[20, "module-arlbench.core.algorithms.ppo", false], [46, "module-arlbench.core.algorithms.ppo", false]], "arlbench.core.algorithms.ppo.models": [[21, "module-arlbench.core.algorithms.ppo.models", false], [46, "module-arlbench.core.algorithms.ppo.models", false]], "arlbench.core.algorithms.ppo.ppo": [[22, "module-arlbench.core.algorithms.ppo.ppo", false], [46, "module-arlbench.core.algorithms.ppo.ppo", false]], "arlbench.core.algorithms.prioritised_item_buffer": [[23, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [44, "module-arlbench.core.algorithms.prioritised_item_buffer", false]], "arlbench.core.algorithms.sac": [[24, "module-arlbench.core.algorithms.sac", false], [47, "module-arlbench.core.algorithms.sac", false]], "arlbench.core.algorithms.sac.models": [[25, "module-arlbench.core.algorithms.sac.models", false], [47, "module-arlbench.core.algorithms.sac.models", false]], "arlbench.core.algorithms.sac.sac": [[26, "module-arlbench.core.algorithms.sac.sac", false], [47, "module-arlbench.core.algorithms.sac.sac", false]], "arlbench.core.environments": [[27, 
"module-arlbench.core.environments", false], [48, "module-arlbench.core.environments", false]], "arlbench.core.environments.autorl_env": [[28, "module-arlbench.core.environments.autorl_env", false], [48, "module-arlbench.core.environments.autorl_env", false]], "arlbench.core.environments.brax_env": [[29, "module-arlbench.core.environments.brax_env", false], [48, "module-arlbench.core.environments.brax_env", false]], "arlbench.core.environments.envpool_env": [[30, "module-arlbench.core.environments.envpool_env", false], [48, "module-arlbench.core.environments.envpool_env", false]], "arlbench.core.environments.gymnasium_env": [[31, "module-arlbench.core.environments.gymnasium_env", false], [48, "module-arlbench.core.environments.gymnasium_env", false]], "arlbench.core.environments.gymnax_env": [[32, "module-arlbench.core.environments.gymnax_env", false], [48, "module-arlbench.core.environments.gymnax_env", false]], "arlbench.core.environments.make_env": [[48, "module-arlbench.core.environments.make_env", false]], "arlbench.core.environments.xland_env": [[34, "module-arlbench.core.environments.xland_env", false], [48, "module-arlbench.core.environments.xland_env", false]], "arlbench.core.running_statistics": [[35, "module-arlbench.core.running_statistics", false], [43, "module-arlbench.core.running_statistics", false]], "arlbench.core.wrappers": [[36, "module-arlbench.core.wrappers", false], [49, "module-arlbench.core.wrappers", false]], "arlbench.core.wrappers.flatten_observation": [[37, "module-arlbench.core.wrappers.flatten_observation", false], [49, "module-arlbench.core.wrappers.flatten_observation", false]], "arlbench.core.wrappers.wrapper": [[38, "module-arlbench.core.wrappers.wrapper", false], [49, "module-arlbench.core.wrappers.wrapper", false]], "arlbench.utils": [[39, "module-arlbench.utils", false], [50, "module-arlbench.utils", false]], "arlbench.utils.common": [[40, "module-arlbench.utils.common", false], [50, "module-arlbench.utils.common", false]], 
"automl": [[58, "term-AutoML", true]], "autorl": [[58, "term-AutoRL", true]], "autorlenv (class in arlbench)": [[5, "arlbench.AutoRLEnv", false], [41, "arlbench.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl)": [[7, "arlbench.autorl.AutoRLEnv", false], [42, "arlbench.autorl.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl.autorl_env)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv", false]], "bo": [[58, "term-BO", true]], "braxenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.BraxEnv", false], [48, "arlbench.core.environments.BraxEnv", false]], "braxenv (class in arlbench.core.environments.brax_env)": [[29, "arlbench.core.environments.brax_env.BraxEnv", false], [48, "arlbench.core.environments.brax_env.BraxEnv", false]], "buffer_state (arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false], [45, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[20, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false], [46, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false], [47, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sacstate attribute)": [[24, 
"arlbench.core.algorithms.sac.SACState.buffer_state", false], [47, "arlbench.core.algorithms.sac.SACState.buffer_state", false]], "checkpointer (class in arlbench.autorl.checkpointing)": [[9, "arlbench.autorl.checkpointing.Checkpointer", false], [42, "arlbench.autorl.checkpointing.Checkpointer", false]], "checkpoints (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.checkpoints", false], [42, "arlbench.autorl.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.checkpoints", false], [41, "arlbench.AutoRLEnv.checkpoints", false]], "cnnactorcritic (class in arlbench.core.algorithms.ppo.models)": [[21, "arlbench.core.algorithms.ppo.models.CNNActorCritic", false], [46, "arlbench.core.algorithms.ppo.models.CNNActorCritic", false]], "cnnq (class in arlbench.core.algorithms.dqn.models)": [[19, "arlbench.core.algorithms.dqn.models.CNNQ", false], [45, "arlbench.core.algorithms.dqn.models.CNNQ", false]], "config (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.config", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.config", false]], "config (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.config", false], [42, "arlbench.autorl.AutoRLEnv.config", false]], "config (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.config", false], [41, "arlbench.AutoRLEnv.config", false]], "config_space (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false]], "config_space (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.config_space", false], [42, "arlbench.autorl.AutoRLEnv.config_space", false]], "config_space 
(arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.config_space", false], [41, "arlbench.AutoRLEnv.config_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils)": [[39, "arlbench.utils.config_space_to_gymnasium_space", false], [50, "arlbench.utils.config_space_to_gymnasium_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.config_space_to_gymnasium_space", false], [50, "arlbench.utils.common.config_space_to_gymnasium_space", false]], "config_space_to_yaml() (in module arlbench.utils)": [[39, "arlbench.utils.config_space_to_yaml", false], [50, "arlbench.utils.config_space_to_yaml", false]], "config_space_to_yaml() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.config_space_to_yaml", false], [50, "arlbench.utils.common.config_space_to_yaml", false]], "count (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[43, "arlbench.core.running_statistics.RunningStatisticsState.count", false]], "create_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[23, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false], [44, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false]], "create_with_opt_state() (arlbench.core.algorithms.dqn.dqn.dqntrainstate class method)": [[45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.ppo.ppo.ppotrainstate class method)": [[46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.sac.sac.sactrainstate class method)": [[47, "arlbench.core.algorithms.sac.sac.SACTrainState.create_with_opt_state", false]], "critic (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.critic", false]], 
"critic_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false]], "critic_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false], [47, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false]], "critic_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false]], "critic_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false], [47, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false]], "critic_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false]], "critic_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false]], "cur_rewards (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false]], "cur_rewards (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false]], "denormalize() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.denormalize", false], [43, "arlbench.core.running_statistics.denormalize", false]], "discrete 
(arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.discrete", false]], "discrete (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.discrete", false]], "done (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.done", false]], "done (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.done", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.done", false]], "done (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.done", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.done", false]], "done (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.done", false], [47, "arlbench.core.algorithms.sac.sac.Transition.done", false]], "dqn": [[58, "term-DQN", true]], "dqn (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.DQN", false], [44, "arlbench.core.algorithms.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQN", false], [45, "arlbench.core.algorithms.dqn.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn.dqn)": [[18, 
"arlbench.core.algorithms.dqn.dqn.DQNMetrics", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false]], "dqnstate (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNState", false], [45, "arlbench.core.algorithms.dqn.DQNState", false]], "dqnstate (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNState", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNState", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false]], "dqntrainreturnt (in module arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false], [45, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false]], "dqntrainstate (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false]], "emissions (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.Emissions", false], [42, "arlbench.autorl.objectives.Emissions", false]], "env_name (arlbench.core.environments.autorl_env.environment property)": [[28, "arlbench.core.environments.autorl_env.Environment.env_name", false], [48, "arlbench.core.environments.autorl_env.Environment.env_name", false]], "env_name 
(arlbench.core.environments.environment property)": [[27, "arlbench.core.environments.Environment.env_name", false], [48, "arlbench.core.environments.Environment.env_name", false]], "env_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false]], "environment (class in arlbench.core.environments)": [[27, "arlbench.core.environments.Environment", false], [48, "arlbench.core.environments.Environment", false]], "environment (class in arlbench.core.environments.autorl_env)": [[28, "arlbench.core.environments.autorl_env.Environment", false], [48, "arlbench.core.environments.autorl_env.Environment", false]], "envpoolenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.EnvpoolEnv", false], [48, "arlbench.core.environments.EnvpoolEnv", 
false]], "envpoolenv (class in arlbench.core.environments.envpool_env)": [[30, "arlbench.core.environments.envpool_env.EnvpoolEnv", false], [48, "arlbench.core.environments.envpool_env.EnvpoolEnv", false]], "eval() (arlbench.autorl.autorl_env.autorlenv method)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false]], "eval() (arlbench.autorl.autorlenv method)": [[7, "arlbench.autorl.AutoRLEnv.eval", false], [42, "arlbench.autorl.AutoRLEnv.eval", false]], "eval() (arlbench.autorlenv method)": [[5, "arlbench.AutoRLEnv.eval", false], [41, "arlbench.AutoRLEnv.eval", false]], "eval() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.eval", false], [44, "arlbench.core.algorithms.Algorithm.eval", false]], "eval() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.eval", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.eval", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards 
(arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false]], "flattenobservationwrapper (class in arlbench.core.wrappers)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper", false], [49, "arlbench.core.wrappers.FlattenObservationWrapper", false]], "flattenobservationwrapper (class in arlbench.core.wrappers.flatten_observation)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false]], "from_tuple() (arlbench.core.algorithms.common.timestep method)": [[44, "arlbench.core.algorithms.common.TimeStep.from_tuple", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false], [45, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() 
(arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false], [46, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false], [47, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false], [44, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false], [44, 
"arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_default_hpo_config", false], [44, "arlbench.core.algorithms.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false], [45, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_default_hpo_config", false], [44, "arlbench.core.algorithms.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false], [46, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_default_hpo_config", false], [44, "arlbench.core.algorithms.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false], [47, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, 
"arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false], [44, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_default_nas_config", false], [44, "arlbench.core.algorithms.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false], [45, "arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_default_nas_config", false], [44, "arlbench.core.algorithms.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false], [46, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() 
(arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_default_nas_config", false], [44, "arlbench.core.algorithms.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false], [47, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false]], "get_hpo_config_space() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false], [44, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_hpo_config_space", false], [44, "arlbench.core.algorithms.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false], [45, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_hpo_config_space", false], [44, "arlbench.core.algorithms.PPO.get_hpo_config_space", false]], "get_hpo_config_space() 
(arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false], [46, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_hpo_config_space", false], [44, "arlbench.core.algorithms.SAC.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false], [47, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false], [44, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_hpo_search_space", false], [44, "arlbench.core.algorithms.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false], [45, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() 
(arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_hpo_search_space", false], [44, "arlbench.core.algorithms.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false], [46, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_hpo_search_space", false], [44, "arlbench.core.algorithms.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false], [47, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false], [44, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false]], 
"get_nas_config_space() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_nas_config_space", false], [44, "arlbench.core.algorithms.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false], [45, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_nas_config_space", false], [44, "arlbench.core.algorithms.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false], [46, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_nas_config_space", false], [44, "arlbench.core.algorithms.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false], [47, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false]], "get_spec() 
(arlbench.autorl.objectives.emissions static method)": [[10, "arlbench.autorl.objectives.Emissions.get_spec", false], [42, "arlbench.autorl.objectives.Emissions.get_spec", false]], "get_spec() (arlbench.autorl.objectives.objective static method)": [[10, "arlbench.autorl.objectives.Objective.get_spec", false], [42, "arlbench.autorl.objectives.Objective.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardmean static method)": [[10, "arlbench.autorl.objectives.RewardMean.get_spec", false], [42, "arlbench.autorl.objectives.RewardMean.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardstd static method)": [[10, "arlbench.autorl.objectives.RewardStd.get_spec", false], [42, "arlbench.autorl.objectives.RewardStd.get_spec", false]], "get_spec() (arlbench.autorl.objectives.runtime static method)": [[10, "arlbench.autorl.objectives.Runtime.get_spec", false], [42, "arlbench.autorl.objectives.Runtime.get_spec", false]], "get_state_space() (arlbench.autorl.state_features.gradinfo static method)": [[11, "arlbench.autorl.state_features.GradInfo.get_state_space", false], [42, "arlbench.autorl.state_features.GradInfo.get_state_space", false]], "get_state_space() (arlbench.autorl.state_features.statefeature static method)": [[11, "arlbench.autorl.state_features.StateFeature.get_state_space", false], [42, "arlbench.autorl.state_features.StateFeature.get_state_space", false]], "global_step (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", 
false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false]], "gradinfo (class in arlbench.autorl.state_features)": [[11, "arlbench.autorl.state_features.GradInfo", false], [42, "arlbench.autorl.state_features.GradInfo", false]], "grads (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppometrics attribute)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils)": [[39, "arlbench.utils.gymnasium_space_to_gymnax_space", false], [50, "arlbench.utils.gymnasium_space_to_gymnax_space", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils.common)": [[40, 
"arlbench.utils.common.gymnasium_space_to_gymnax_space", false], [50, "arlbench.utils.common.gymnasium_space_to_gymnax_space", false]], "gymnasiumenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.GymnasiumEnv", false], [48, "arlbench.core.environments.GymnasiumEnv", false]], "gymnasiumenv (class in arlbench.core.environments.gymnasium_env)": [[31, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false], [48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false]], "gymnaxenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.GymnaxEnv", false], [48, "arlbench.core.environments.GymnaxEnv", false]], "gymnaxenv (class in arlbench.core.environments.gymnax_env)": [[32, "arlbench.core.environments.gymnax_env.GymnaxEnv", false], [48, "arlbench.core.environments.gymnax_env.GymnaxEnv", false]], "hidden_size (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": 
[[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.hidden_size", false]], "hpo": [[58, "term-HPO", true]], "hpo_config (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.hpo_config", false], [42, "arlbench.autorl.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.hpo_config", false], [41, "arlbench.AutoRLEnv.hpo_config", false]], "info (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.info", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.info", false]], "info (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.info", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.info", false]], "info (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.info", false], [47, "arlbench.core.algorithms.sac.sac.Transition.info", false]], "init() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.init", false], [44, "arlbench.core.algorithms.Algorithm.init", false]], "init() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.init", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.init", false]], "init() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.init", false], [44, "arlbench.core.algorithms.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn method)": [[17, "arlbench.core.algorithms.dqn.DQN.init", false], [45, 
"arlbench.core.algorithms.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.init", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.ppo method)": [[13, "arlbench.core.algorithms.PPO.init", false], [44, "arlbench.core.algorithms.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo method)": [[20, "arlbench.core.algorithms.ppo.PPO.init", false], [46, "arlbench.core.algorithms.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.init", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.init", false], [44, "arlbench.core.algorithms.SAC.init", false]], "init() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.init", false], [47, "arlbench.core.algorithms.sac.SAC.init", false]], "init() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.init", false], [47, "arlbench.core.algorithms.sac.sac.SAC.init", false]], "init_state() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.init_state", false], [43, "arlbench.core.running_statistics.init_state", false]], "items() (arlbench.core.algorithms.common.timestep method)": [[16, "arlbench.core.algorithms.common.TimeStep.items", false], [44, "arlbench.core.algorithms.common.TimeStep.items", false]], "key (arlbench.autorl.objectives.emissions attribute)": [[42, "arlbench.autorl.objectives.Emissions.KEY", false]], "key (arlbench.autorl.objectives.objective attribute)": [[42, "arlbench.autorl.objectives.Objective.KEY", false]], "key (arlbench.autorl.objectives.rewardmean attribute)": [[42, "arlbench.autorl.objectives.RewardMean.KEY", false]], "key (arlbench.autorl.objectives.rewardstd attribute)": [[42, 
"arlbench.autorl.objectives.RewardStd.KEY", false]], "key (arlbench.autorl.objectives.runtime attribute)": [[42, "arlbench.autorl.objectives.Runtime.KEY", false]], "key (arlbench.autorl.state_features.gradinfo attribute)": [[42, "arlbench.autorl.state_features.GradInfo.KEY", false]], "key (arlbench.autorl.state_features.statefeature attribute)": [[42, "arlbench.autorl.state_features.StateFeature.KEY", false]], "keys() (arlbench.core.algorithms.common.timestep method)": [[16, "arlbench.core.algorithms.common.TimeStep.keys", false], [44, "arlbench.core.algorithms.common.TimeStep.keys", false]], "last_obs (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.last_obs", false]], "load() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.load", false], [42, "arlbench.autorl.checkpointing.Checkpointer.load", false]], "load_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false], [42, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false]], "log_prob (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false]], "log_std_max (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_max", false]], "log_std_max (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_max", false]], "log_std_min (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_min", false]], "log_std_min (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_min", false]], "loss 
(arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppometrics attribute)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false]], "make_env() (in module arlbench.core.environments)": [[27, "arlbench.core.environments.make_env", false], [33, "arlbench.core.environments.make_env", false], [48, "arlbench.core.environments.make_env", false]], "make_env() (in module arlbench.core.environments.make_env)": [[48, "arlbench.core.environments.make_env.make_env", false]], "make_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[23, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false], [44, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false]], "mean (arlbench.core.running_statistics.nestedmeanstd attribute)": [[43, "arlbench.core.running_statistics.NestedMeanStd.mean", false]], "metrics (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false]], "metrics 
(arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false]], "mlpactorcritic (class in arlbench.core.algorithms.ppo.models)": [[21, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false], [46, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false]], "mlpq (class in arlbench.core.algorithms.dqn.models)": [[19, "arlbench.core.algorithms.dqn.models.MLPQ", false], [45, "arlbench.core.algorithms.dqn.models.MLPQ", false]], "mode() (arlbench.core.algorithms.sac.models.tanhtransformeddistribution method)": [[25, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false], [47, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false]], "module": [[5, "module-arlbench", false], [6, "module-arlbench.arlbench", false], [7, "module-arlbench.autorl", false], [8, "module-arlbench.autorl.autorl_env", false], [9, "module-arlbench.autorl.checkpointing", false], [10, "module-arlbench.autorl.objectives", false], [11, "module-arlbench.autorl.state_features", false], [12, "module-arlbench.core", false], [13, "module-arlbench.core.algorithms", false], [14, "module-arlbench.core.algorithms.algorithm", false], [15, 
"module-arlbench.core.algorithms.buffers", false], [16, "module-arlbench.core.algorithms.common", false], [17, "module-arlbench.core.algorithms.dqn", false], [18, "module-arlbench.core.algorithms.dqn.dqn", false], [19, "module-arlbench.core.algorithms.dqn.models", false], [20, "module-arlbench.core.algorithms.ppo", false], [21, "module-arlbench.core.algorithms.ppo.models", false], [22, "module-arlbench.core.algorithms.ppo.ppo", false], [23, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [24, "module-arlbench.core.algorithms.sac", false], [25, "module-arlbench.core.algorithms.sac.models", false], [26, "module-arlbench.core.algorithms.sac.sac", false], [27, "module-arlbench.core.environments", false], [28, "module-arlbench.core.environments.autorl_env", false], [29, "module-arlbench.core.environments.brax_env", false], [30, "module-arlbench.core.environments.envpool_env", false], [31, "module-arlbench.core.environments.gymnasium_env", false], [32, "module-arlbench.core.environments.gymnax_env", false], [34, "module-arlbench.core.environments.xland_env", false], [35, "module-arlbench.core.running_statistics", false], [36, "module-arlbench.core.wrappers", false], [37, "module-arlbench.core.wrappers.flatten_observation", false], [38, "module-arlbench.core.wrappers.wrapper", false], [39, "module-arlbench.utils", false], [40, "module-arlbench.utils.common", false], [41, "module-arlbench", false], [41, "module-arlbench.arlbench", false], [42, "module-arlbench.autorl", false], [42, "module-arlbench.autorl.autorl_env", false], [42, "module-arlbench.autorl.checkpointing", false], [42, "module-arlbench.autorl.objectives", false], [42, "module-arlbench.autorl.state_features", false], [43, "module-arlbench.core", false], [43, "module-arlbench.core.running_statistics", false], [44, "module-arlbench.core.algorithms", false], [44, "module-arlbench.core.algorithms.algorithm", false], [44, "module-arlbench.core.algorithms.buffers", false], [44, 
"module-arlbench.core.algorithms.common", false], [44, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [45, "module-arlbench.core.algorithms.dqn", false], [45, "module-arlbench.core.algorithms.dqn.dqn", false], [45, "module-arlbench.core.algorithms.dqn.models", false], [46, "module-arlbench.core.algorithms.ppo", false], [46, "module-arlbench.core.algorithms.ppo.models", false], [46, "module-arlbench.core.algorithms.ppo.ppo", false], [47, "module-arlbench.core.algorithms.sac", false], [47, "module-arlbench.core.algorithms.sac.models", false], [47, "module-arlbench.core.algorithms.sac.sac", false], [48, "module-arlbench.core.environments", false], [48, "module-arlbench.core.environments.autorl_env", false], [48, "module-arlbench.core.environments.brax_env", false], [48, "module-arlbench.core.environments.envpool_env", false], [48, "module-arlbench.core.environments.gymnasium_env", false], [48, "module-arlbench.core.environments.gymnax_env", false], [48, "module-arlbench.core.environments.make_env", false], [48, "module-arlbench.core.environments.xland_env", false], [49, "module-arlbench.core.wrappers", false], [49, "module-arlbench.core.wrappers.flatten_observation", false], [49, "module-arlbench.core.wrappers.wrapper", false], [50, "module-arlbench.utils", false], [50, "module-arlbench.utils.common", false]], "mrp_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[42, "arlbench.autorl.checkpointing.Checkpointer.MRP_FILE", false]], "multi-fidelity optimization": [[58, "term-Multi-fidelity-optimization", true]], "n_critics (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.n_critics", false]], "n_envs (arlbench.core.environments.autorl_env.environment property)": [[28, "arlbench.core.environments.autorl_env.Environment.n_envs", false], [48, "arlbench.core.environments.autorl_env.Environment.n_envs", false]], "n_envs (arlbench.core.environments.environment 
property)": [[27, "arlbench.core.environments.Environment.n_envs", false], [48, "arlbench.core.environments.Environment.n_envs", false]], "name (arlbench.core.algorithms.algorithm attribute)": [[44, "arlbench.core.algorithms.Algorithm.name", false]], "name (arlbench.core.algorithms.algorithm.algorithm attribute)": [[44, "arlbench.core.algorithms.algorithm.Algorithm.name", false]], "name (arlbench.core.algorithms.dqn attribute)": [[44, "arlbench.core.algorithms.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn attribute)": [[45, "arlbench.core.algorithms.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn.dqn attribute)": [[45, "arlbench.core.algorithms.dqn.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.name", false]], "name (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.name", false]], "name (arlbench.core.algorithms.ppo attribute)": [[44, "arlbench.core.algorithms.PPO.name", false]], "name (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.ppo attribute)": [[46, "arlbench.core.algorithms.ppo.PPO.name", false]], "name (arlbench.core.algorithms.ppo.ppo.ppo attribute)": [[46, "arlbench.core.algorithms.ppo.ppo.PPO.name", false]], "name (arlbench.core.algorithms.sac attribute)": [[44, "arlbench.core.algorithms.SAC.name", false]], "name (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.name", false]], "name (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.name", false]], "name 
(arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.name", false]], "name (arlbench.core.algorithms.sac.sac attribute)": [[47, "arlbench.core.algorithms.sac.SAC.name", false]], "name (arlbench.core.algorithms.sac.sac.sac attribute)": [[47, "arlbench.core.algorithms.sac.sac.SAC.name", false]], "nestedmeanstd (class in arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.NestedMeanStd", false], [43, "arlbench.core.running_statistics.NestedMeanStd", false]], "network_state (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[47, "arlbench.core.algorithms.sac.sac.SACTrainState.network_state", false]], "nodes_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[42, "arlbench.autorl.checkpointing.Checkpointer.NODES_FILE", false]], "normalize() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.normalize", false], [43, "arlbench.core.running_statistics.normalize", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate 
attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false]], "numpy_to_jax() (in module arlbench.core.environments.envpool_env)": [[30, "arlbench.core.environments.envpool_env.numpy_to_jax", false], [48, "arlbench.core.environments.envpool_env.numpy_to_jax", false]], "objective (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.Objective", false], [42, "arlbench.autorl.objectives.Objective", false]], "objectives (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false]], "objectives (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.objectives", false], [42, "arlbench.autorl.AutoRLEnv.objectives", false]], "objectives (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.objectives", false], [41, "arlbench.AutoRLEnv.objectives", false]], "obs (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false], 
[45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false]], "obs (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false]], "obs (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.obs", false], [47, "arlbench.core.algorithms.sac.sac.Transition.obs", false]], "obs (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.obs", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.obs", false]], "observation_space (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.observation_space", false], [42, 
"arlbench.autorl.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.observation_space", false], [41, "arlbench.AutoRLEnv.observation_space", false]], "observation_space (arlbench.core.environments.brax_env.braxenv property)": [[29, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false], [48, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.braxenv property)": [[27, "arlbench.core.environments.BraxEnv.observation_space", false], [48, "arlbench.core.environments.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[30, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false], [48, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false]], "observation_space (arlbench.core.environments.envpoolenv property)": [[27, "arlbench.core.environments.EnvpoolEnv.observation_space", false], [48, "arlbench.core.environments.EnvpoolEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[31, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false], [48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasiumenv property)": [[27, "arlbench.core.environments.GymnasiumEnv.observation_space", false], [48, "arlbench.core.environments.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[32, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false], [48, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnaxenv property)": [[27, "arlbench.core.environments.GymnaxEnv.observation_space", false], 
[48, "arlbench.core.environments.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.xland_env.xlandenv property)": [[34, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false], [48, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false]], "observation_space (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper property)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false]], "observation_space (arlbench.core.wrappers.flattenobservationwrapper property)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false], [49, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false]], "observation_space() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.observation_space", false], [48, "arlbench.core.environments.autorl_env.Environment.observation_space", false]], "observation_space() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.observation_space", false], [48, "arlbench.core.environments.Environment.observation_space", false]], "opt_state (arlbench.core.algorithms.dqn.dqn.dqntrainstate attribute)": [[45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.opt_state", false]], "opt_state (arlbench.core.algorithms.ppo.ppo.ppotrainstate attribute)": [[46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.opt_state", false]], "parent (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.parent", false]], "parent (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.parent", false]], "parent (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, 
"arlbench.core.algorithms.ppo.models.CNNActorCritic.parent", false]], "parent (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.parent", false]], "ppo": [[58, "term-PPO", true]], "ppo (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.PPO", false], [44, "arlbench.core.algorithms.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPO", false], [46, "arlbench.core.algorithms.ppo.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO", false]], "ppometrics (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics", false]], "ppometrics (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo)": [[20, 
"arlbench.core.algorithms.ppo.PPORunnerState", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false]], "ppostate (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOState", false], [46, "arlbench.core.algorithms.ppo.PPOState", false]], "ppostate (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOState", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOState", false]], "ppotrainingresult (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult", false]], "ppotrainingresult (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false]], "ppotrainreturnt (in module arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false], [46, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false]], "ppotrainstate (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false]], "predict() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.predict", false], [44, "arlbench.core.algorithms.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.predict", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.predict", false], [44, "arlbench.core.algorithms.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn 
method)": [[17, "arlbench.core.algorithms.dqn.DQN.predict", false], [45, "arlbench.core.algorithms.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.ppo method)": [[13, "arlbench.core.algorithms.PPO.predict", false], [44, "arlbench.core.algorithms.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo method)": [[20, "arlbench.core.algorithms.ppo.PPO.predict", false], [46, "arlbench.core.algorithms.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.predict", false], [44, "arlbench.core.algorithms.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.predict", false], [47, "arlbench.core.algorithms.sac.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.predict", false], [47, "arlbench.core.algorithms.sac.sac.SAC.predict", false]], "random search": [[58, "term-Random-Search", true]], "rank (arlbench.autorl.objectives.emissions attribute)": [[42, "arlbench.autorl.objectives.Emissions.RANK", false]], "rank (arlbench.autorl.objectives.objective attribute)": [[42, "arlbench.autorl.objectives.Objective.RANK", false]], "rank (arlbench.autorl.objectives.rewardmean attribute)": [[42, "arlbench.autorl.objectives.RewardMean.RANK", false]], "rank (arlbench.autorl.objectives.rewardstd attribute)": [[42, "arlbench.autorl.objectives.RewardStd.RANK", false]], "rank (arlbench.autorl.objectives.runtime attribute)": [[42, "arlbench.autorl.objectives.Runtime.RANK", false]], "recursive_concat() (in 
module arlbench.utils)": [[39, "arlbench.utils.recursive_concat", false], [50, "arlbench.utils.recursive_concat", false]], "recursive_concat() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.recursive_concat", false], [50, "arlbench.utils.common.recursive_concat", false]], "replace() (arlbench.core.algorithms.common.timestep method)": [[44, "arlbench.core.algorithms.common.TimeStep.replace", false]], "replace() (arlbench.core.algorithms.dqn.dqn.dqntrainstate method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false]], "replace() (arlbench.core.algorithms.ppo.ppo.ppotrainstate method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false]], "replace() (arlbench.core.algorithms.sac.sac.sactrainstate method)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false]], "replace() (arlbench.core.running_statistics.nestedmeanstd method)": [[35, "arlbench.core.running_statistics.NestedMeanStd.replace", false], [43, "arlbench.core.running_statistics.NestedMeanStd.replace", false]], "replace() (arlbench.core.running_statistics.runningstatisticsstate method)": [[35, "arlbench.core.running_statistics.RunningStatisticsState.replace", false], [43, "arlbench.core.running_statistics.RunningStatisticsState.replace", false]], "reset() (arlbench.autorl.autorl_env.autorlenv method)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false]], "reset() (arlbench.autorl.autorlenv method)": [[7, "arlbench.autorl.AutoRLEnv.reset", false], [42, "arlbench.autorl.AutoRLEnv.reset", false]], "reset() (arlbench.autorlenv method)": [[5, "arlbench.AutoRLEnv.reset", false], [41, "arlbench.AutoRLEnv.reset", false]], "reset() 
(arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.reset", false], [48, "arlbench.core.environments.autorl_env.Environment.reset", false]], "reset() (arlbench.core.environments.brax_env.braxenv method)": [[48, "arlbench.core.environments.brax_env.BraxEnv.reset", false]], "reset() (arlbench.core.environments.braxenv method)": [[48, "arlbench.core.environments.BraxEnv.reset", false]], "reset() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.reset", false], [48, "arlbench.core.environments.Environment.reset", false]], "reset() (arlbench.core.environments.envpool_env.envpoolenv method)": [[48, "arlbench.core.environments.envpool_env.EnvpoolEnv.reset", false]], "reset() (arlbench.core.environments.envpoolenv method)": [[48, "arlbench.core.environments.EnvpoolEnv.reset", false]], "reset() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnasiumenv method)": [[48, "arlbench.core.environments.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[48, "arlbench.core.environments.gymnax_env.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.gymnaxenv method)": [[48, "arlbench.core.environments.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.xland_env.xlandenv method)": [[48, "arlbench.core.environments.xland_env.XLandEnv.reset", false]], "reset() (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false]], "reset() (arlbench.core.wrappers.flattenobservationwrapper method)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper.reset", false], [49, 
"arlbench.core.wrappers.FlattenObservationWrapper.reset", false]], "return_buffer (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false]], "return_buffer (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false]], "reward (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.reward", false]], "reward (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false]], "reward (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false]], "reward (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.reward", false], [47, "arlbench.core.algorithms.sac.sac.Transition.reward", false]], "rewardmean (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.RewardMean", false], [42, "arlbench.autorl.objectives.RewardMean", false]], "rewardstd (class in arlbench.autorl.objectives)": [[10, 
"arlbench.autorl.objectives.RewardStd", false], [42, "arlbench.autorl.objectives.RewardStd", false]], "rng (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.rng", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.rng", false]], "rng (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false]], "rng (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.rng", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.rng", false]], "run_arlbench() (in module arlbench)": [[5, "arlbench.run_arlbench", false], [41, "arlbench.run_arlbench", false]], "run_arlbench() (in module arlbench.arlbench)": [[6, "arlbench.arlbench.run_arlbench", false], [41, "arlbench.arlbench.run_arlbench", false]], "runner_state (arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false]], "runner_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNState.runner_state", false], [45, "arlbench.core.algorithms.dqn.DQNState.runner_state", false]], "runner_state 
(arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[20, "arlbench.core.algorithms.ppo.PPOState.runner_state", false], [46, "arlbench.core.algorithms.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false], [47, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sacstate attribute)": [[24, "arlbench.core.algorithms.sac.SACState.runner_state", false], [47, "arlbench.core.algorithms.sac.SACState.runner_state", false]], "runningstatisticsstate (class in arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.RunningStatisticsState", false], [43, "arlbench.core.running_statistics.RunningStatisticsState", false]], "runtime (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.Runtime", false], [42, "arlbench.autorl.objectives.Runtime", false]], "sac": [[58, "term-SAC", true]], "sac (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.SAC", false], [44, "arlbench.core.algorithms.SAC", false]], "sac (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SAC", false], [47, "arlbench.core.algorithms.sac.SAC", false]], "sac (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SAC", false], [47, "arlbench.core.algorithms.sac.sac.SAC", false]], "saccnnactor (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACCNNActor", false], [47, "arlbench.core.algorithms.sac.models.SACCNNActor", false]], "saccnncritic (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACCNNCritic", false], [47, 
"arlbench.core.algorithms.sac.models.SACCNNCritic", false]], "sacmetrics (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACMetrics", false], [47, "arlbench.core.algorithms.sac.SACMetrics", false]], "sacmetrics (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics", false]], "sacmlpactor (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACMLPActor", false], [47, "arlbench.core.algorithms.sac.models.SACMLPActor", false]], "sacmlpcritic (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACMLPCritic", false], [47, "arlbench.core.algorithms.sac.models.SACMLPCritic", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACRunnerState", false], [47, "arlbench.core.algorithms.sac.SACRunnerState", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState", false]], "sacstate (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACState", false], [47, "arlbench.core.algorithms.sac.SACState", false]], "sacstate (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACState", false], [47, "arlbench.core.algorithms.sac.sac.SACState", false]], "sactrainingresult (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult", false]], "sactrainingresult (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false]], "sactrainreturnt (in module arlbench.core.algorithms.sac)": [[24, 
"arlbench.core.algorithms.sac.SACTrainReturnT", false], [47, "arlbench.core.algorithms.sac.SACTrainReturnT", false]], "sactrainstate (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainState", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainState", false]], "sacvectorcritic (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACVectorCritic", false], [47, "arlbench.core.algorithms.sac.models.SACVectorCritic", false]], "sample_action() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[48, "arlbench.core.environments.gymnax_env.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.gymnaxenv method)": [[48, "arlbench.core.environments.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.xland_env.xlandenv method)": [[48, "arlbench.core.environments.xland_env.XLandEnv.sample_action", false]], "sample_actions() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.sample_actions", false], [48, "arlbench.core.environments.autorl_env.Environment.sample_actions", false]], "sample_actions() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.sample_actions", false], [48, "arlbench.core.environments.Environment.sample_actions", false]], "save() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.save", false], [42, "arlbench.autorl.checkpointing.Checkpointer.save", false]], "save_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false], [42, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false]], "save_defaults_to_yaml() (in module arlbench.utils)": [[39, "arlbench.utils.save_defaults_to_yaml", false], [50, "arlbench.utils.save_defaults_to_yaml", false]], 
"save_defaults_to_yaml() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.save_defaults_to_yaml", false], [50, "arlbench.utils.common.save_defaults_to_yaml", false]], "scalars_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[42, "arlbench.autorl.checkpointing.Checkpointer.SCALARS_FILE", false]], "scope (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.scope", false]], "scope (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.scope", false]], "scope (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.scope", false]], "scope (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.scope", false]], "setup() (arlbench.core.algorithms.dqn.models.cnnq method)": [[19, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false], [45, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false]], "setup() (arlbench.core.algorithms.dqn.models.mlpq method)": [[19, 
"arlbench.core.algorithms.dqn.models.MLPQ.setup", false], [45, "arlbench.core.algorithms.dqn.models.MLPQ.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false], [46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false], [46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.alphacoef method)": [[25, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false], [47, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNActor.setup", false], [47, "arlbench.core.algorithms.sac.models.SACCNNActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false], [47, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false], [47, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false], [47, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false]], "statefeature (class in arlbench.autorl.state_features)": [[11, "arlbench.autorl.state_features.StateFeature", false], [42, "arlbench.autorl.state_features.StateFeature", false]], "std (arlbench.core.running_statistics.nestedmeanstd attribute)": [[43, "arlbench.core.running_statistics.NestedMeanStd.std", false]], "step() (arlbench.autorl.autorl_env.autorlenv method)": [[8, 
"arlbench.autorl.autorl_env.AutoRLEnv.step", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.step", false]], "step() (arlbench.autorl.autorlenv method)": [[7, "arlbench.autorl.AutoRLEnv.step", false], [42, "arlbench.autorl.AutoRLEnv.step", false]], "step() (arlbench.autorlenv method)": [[5, "arlbench.AutoRLEnv.step", false], [41, "arlbench.AutoRLEnv.step", false]], "step() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.step", false], [48, "arlbench.core.environments.autorl_env.Environment.step", false]], "step() (arlbench.core.environments.brax_env.braxenv method)": [[48, "arlbench.core.environments.brax_env.BraxEnv.step", false]], "step() (arlbench.core.environments.braxenv method)": [[48, "arlbench.core.environments.BraxEnv.step", false]], "step() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.step", false], [48, "arlbench.core.environments.Environment.step", false]], "step() (arlbench.core.environments.envpool_env.envpoolenv method)": [[48, "arlbench.core.environments.envpool_env.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.envpoolenv method)": [[48, "arlbench.core.environments.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnasiumenv method)": [[48, "arlbench.core.environments.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[48, "arlbench.core.environments.gymnax_env.GymnaxEnv.step", false]], "step() (arlbench.core.environments.gymnaxenv method)": [[48, "arlbench.core.environments.GymnaxEnv.step", false]], "step() (arlbench.core.environments.xland_env.xlandenv method)": [[48, "arlbench.core.environments.xland_env.XLandEnv.step", false]], "step() 
(arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false]], "step() (arlbench.core.wrappers.flattenobservationwrapper method)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper.step", false], [49, "arlbench.core.wrappers.FlattenObservationWrapper.step", false]], "summed_variance (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[43, "arlbench.core.running_statistics.RunningStatisticsState.summed_variance", false]], "tanhtransformeddistribution (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false], [47, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false]], "target_params (arlbench.core.algorithms.dqn.dqn.dqntrainstate attribute)": [[45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.target_params", false]], "target_params (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[47, "arlbench.core.algorithms.sac.sac.SACTrainState.target_params", false]], "td_error (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.td_error", false], [47, "arlbench.core.algorithms.sac.SACMetrics.td_error", 
false]], "timestep (class in arlbench.core.algorithms.common)": [[16, "arlbench.core.algorithms.common.TimeStep", false], [44, "arlbench.core.algorithms.common.TimeStep", false]], "to_tuple() (arlbench.core.algorithms.common.timestep method)": [[44, "arlbench.core.algorithms.common.TimeStep.to_tuple", false]], "train() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.train", false], [44, "arlbench.core.algorithms.Algorithm.train", false]], "train() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.train", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.train", false]], "train() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.train", false], [44, "arlbench.core.algorithms.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn method)": [[17, "arlbench.core.algorithms.dqn.DQN.train", false], [45, "arlbench.core.algorithms.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.train", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.ppo method)": [[13, "arlbench.core.algorithms.PPO.train", false], [44, "arlbench.core.algorithms.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo method)": [[20, "arlbench.core.algorithms.ppo.PPO.train", false], [46, "arlbench.core.algorithms.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.train", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.train", false], [44, "arlbench.core.algorithms.SAC.train", false]], "train() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.train", false], [47, "arlbench.core.algorithms.sac.SAC.train", false]], 
"train() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.train", false], [47, "arlbench.core.algorithms.sac.sac.SAC.train", false]], "train_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.train_state", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.train_state", false]], "trajectories (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", 
false]], "trajectories (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false]], "transition (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition", false]], "transition (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition", false]], "transition (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.Transition", false], [47, "arlbench.core.algorithms.sac.sac.Transition", false]], "tuple_concat() (in module arlbench.utils)": [[39, "arlbench.utils.tuple_concat", false], [50, "arlbench.utils.tuple_concat", false]], "tuple_concat() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.tuple_concat", false], [50, "arlbench.utils.common.tuple_concat", false]], "uniform_sample() (in module arlbench.core.algorithms.buffers)": [[15, "arlbench.core.algorithms.buffers.uniform_sample", false], [44, "arlbench.core.algorithms.buffers.uniform_sample", false]], "update() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.update", false], [44, "arlbench.core.algorithms.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn method)": [[17, "arlbench.core.algorithms.dqn.DQN.update", false], [45, "arlbench.core.algorithms.dqn.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.update", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.update", 
false]], "update() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.update", false], [43, "arlbench.core.running_statistics.update", false]], "update_actor() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.update_actor", false], [44, "arlbench.core.algorithms.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.update_actor", false], [47, "arlbench.core.algorithms.sac.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false], [47, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false]], "update_alpha() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.update_alpha", false], [44, "arlbench.core.algorithms.SAC.update_alpha", false]], "update_alpha() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.update_alpha", false], [47, "arlbench.core.algorithms.sac.SAC.update_alpha", false]], "update_alpha() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false], [47, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false]], "update_critic() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.update_critic", false], [44, "arlbench.core.algorithms.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.update_critic", false], [47, "arlbench.core.algorithms.sac.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false], [47, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.update_hpo_config", false], 
[44, "arlbench.core.algorithms.Algorithm.update_hpo_config", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false]], "value (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.value", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.value", false]], "value (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.value", false], [47, "arlbench.core.algorithms.sac.sac.Transition.value", false]], "values() (arlbench.core.algorithms.common.timestep method)": [[16, "arlbench.core.algorithms.common.TimeStep.values", false], [44, "arlbench.core.algorithms.common.TimeStep.values", false]], "wrapper (class in arlbench.core.wrappers)": [[36, "arlbench.core.wrappers.Wrapper", false], [49, "arlbench.core.wrappers.Wrapper", false]], "wrapper (class in arlbench.core.wrappers.wrapper)": [[38, "arlbench.core.wrappers.wrapper.Wrapper", false], [49, "arlbench.core.wrappers.wrapper.Wrapper", false]], "xlandenv (class in arlbench.core.environments.xland_env)": [[34, "arlbench.core.environments.xland_env.XLandEnv", false], [48, "arlbench.core.environments.xland_env.XLandEnv", false]]}, "objects": {"": [[41, 0, 0, "-", "arlbench"]], "arlbench": [[41, 1, 1, "", "AutoRLEnv"], [41, 0, 0, "-", "arlbench"], [42, 0, 0, "-", "autorl"], [43, 0, 0, "-", "core"], [41, 5, 1, "", "run_arlbench"], [50, 0, 0, "-", "utils"]], "arlbench.AutoRLEnv": [[41, 2, 1, "", "ALGORITHMS"], [41, 3, 1, "", "action_space"], [41, 3, 1, "", "checkpoints"], [41, 3, 1, "", "config"], [41, 3, 1, "", "config_space"], [41, 4, 1, "", "eval"], [41, 3, 1, "", "hpo_config"], [41, 3, 1, "", "objectives"], [41, 3, 1, "", "observation_space"], [41, 4, 1, "", "reset"], [41, 4, 1, "", "step"]], "arlbench.arlbench": [[41, 5, 1, 
"", "run_arlbench"]], "arlbench.autorl": [[42, 1, 1, "", "AutoRLEnv"], [42, 0, 0, "-", "autorl_env"], [42, 0, 0, "-", "checkpointing"], [42, 0, 0, "-", "objectives"], [42, 0, 0, "-", "state_features"]], "arlbench.autorl.AutoRLEnv": [[42, 2, 1, "", "ALGORITHMS"], [42, 3, 1, "", "action_space"], [42, 3, 1, "", "checkpoints"], [42, 3, 1, "", "config"], [42, 3, 1, "", "config_space"], [42, 4, 1, "", "eval"], [42, 3, 1, "", "hpo_config"], [42, 3, 1, "", "objectives"], [42, 3, 1, "", "observation_space"], [42, 4, 1, "", "reset"], [42, 4, 1, "", "step"]], "arlbench.autorl.autorl_env": [[42, 1, 1, "", "AutoRLEnv"]], "arlbench.autorl.autorl_env.AutoRLEnv": [[42, 2, 1, "", "ALGORITHMS"], [42, 3, 1, "", "action_space"], [42, 3, 1, "", "checkpoints"], [42, 3, 1, "", "config"], [42, 3, 1, "", "config_space"], [42, 4, 1, "", "eval"], [42, 3, 1, "", "hpo_config"], [42, 3, 1, "", "objectives"], [42, 3, 1, "", "observation_space"], [42, 4, 1, "", "reset"], [42, 4, 1, "", "step"]], "arlbench.autorl.checkpointing": [[42, 1, 1, "", "Checkpointer"]], "arlbench.autorl.checkpointing.Checkpointer": [[42, 2, 1, "", "MRP_FILE"], [42, 2, 1, "", "NODES_FILE"], [42, 2, 1, "", "SCALARS_FILE"], [42, 4, 1, "", "load"], [42, 4, 1, "", "load_buffer"], [42, 4, 1, "", "save"], [42, 4, 1, "", "save_buffer"]], "arlbench.autorl.objectives": [[42, 1, 1, "", "Emissions"], [42, 1, 1, "", "Objective"], [42, 1, 1, "", "RewardMean"], [42, 1, 1, "", "RewardStd"], [42, 1, 1, "", "Runtime"]], "arlbench.autorl.objectives.Emissions": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Objective": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "__lt__"], [42, 4, 1, "", "__new__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardMean": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardStd": 
[[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Runtime": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.state_features": [[42, 1, 1, "", "GradInfo"], [42, 1, 1, "", "StateFeature"]], "arlbench.autorl.state_features.GradInfo": [[42, 2, 1, "", "KEY"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_state_space"]], "arlbench.autorl.state_features.StateFeature": [[42, 2, 1, "", "KEY"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "__new__"], [42, 4, 1, "", "get_state_space"]], "arlbench.core": [[44, 0, 0, "-", "algorithms"], [48, 0, 0, "-", "environments"], [43, 0, 0, "-", "running_statistics"], [49, 0, 0, "-", "wrappers"]], "arlbench.core.algorithms": [[44, 1, 1, "", "Algorithm"], [44, 1, 1, "", "DQN"], [44, 1, 1, "", "PPO"], [44, 1, 1, "", "SAC"], [44, 0, 0, "-", "algorithm"], [44, 0, 0, "-", "buffers"], [44, 0, 0, "-", "common"], [45, 0, 0, "-", "dqn"], [46, 0, 0, "-", "ppo"], [44, 0, 0, "-", "prioritised_item_buffer"], [47, 0, 0, "-", "sac"]], "arlbench.core.algorithms.Algorithm": [[44, 3, 1, "", "action_type"], [44, 4, 1, "", "eval"], [44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.DQN": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", 
"update"]], "arlbench.core.algorithms.PPO": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"]], "arlbench.core.algorithms.SAC": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_actor"], [44, 4, 1, "", "update_alpha"], [44, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.algorithm": [[44, 1, 1, "", "Algorithm"]], "arlbench.core.algorithms.algorithm.Algorithm": [[44, 3, 1, "", "action_type"], [44, 4, 1, "", "eval"], [44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.buffers": [[44, 5, 1, "", "uniform_sample"]], "arlbench.core.algorithms.common": [[44, 1, 1, "", "TimeStep"]], "arlbench.core.algorithms.common.TimeStep": [[44, 2, 1, "", "action"], [44, 2, 1, "", "done"], [44, 4, 1, "", "from_tuple"], [44, 4, 1, "", "items"], [44, 4, 1, "", "keys"], [44, 2, 1, "", "last_obs"], [44, 2, 1, "", "obs"], [44, 4, 1, "", "replace"], [44, 2, 1, "", "reward"], [44, 4, 1, "", "to_tuple"], [44, 4, 1, "", "values"]], "arlbench.core.algorithms.dqn": [[45, 1, 1, "", "DQN"], [45, 1, 1, "", "DQNMetrics"], [45, 1, 1, "", 
"DQNRunnerState"], [45, 1, 1, "", "DQNState"], [45, 2, 1, "", "DQNTrainReturnT"], [45, 1, 1, "", "DQNTrainingResult"], [45, 0, 0, "-", "dqn"], [45, 0, 0, "-", "models"]], "arlbench.core.algorithms.dqn.DQN": [[45, 4, 1, "", "get_checkpoint_factory"], [45, 4, 1, "", "get_default_hpo_config"], [45, 4, 1, "", "get_default_nas_config"], [45, 4, 1, "", "get_hpo_config_space"], [45, 4, 1, "", "get_hpo_search_space"], [45, 4, 1, "", "get_nas_config_space"], [45, 4, 1, "", "init"], [45, 2, 1, "", "name"], [45, 4, 1, "", "predict"], [45, 4, 1, "", "train"], [45, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.DQNMetrics": [[45, 2, 1, "", "grads"], [45, 2, 1, "", "loss"], [45, 2, 1, "", "td_error"]], "arlbench.core.algorithms.dqn.DQNRunnerState": [[45, 2, 1, "", "env_state"], [45, 2, 1, "", "global_step"], [45, 2, 1, "", "normalizer_state"], [45, 2, 1, "", "obs"], [45, 2, 1, "", "rng"], [45, 2, 1, "", "train_state"]], "arlbench.core.algorithms.dqn.DQNState": [[45, 2, 1, "", "buffer_state"], [45, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.DQNTrainingResult": [[45, 2, 1, "", "eval_rewards"], [45, 2, 1, "", "metrics"], [45, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn": [[45, 1, 1, "", "DQN"], [45, 1, 1, "", "DQNMetrics"], [45, 1, 1, "", "DQNRunnerState"], [45, 1, 1, "", "DQNState"], [45, 1, 1, "", "DQNTrainState"], [45, 1, 1, "", "DQNTrainingResult"], [45, 1, 1, "", "Transition"]], "arlbench.core.algorithms.dqn.dqn.DQN": [[45, 4, 1, "", "get_checkpoint_factory"], [45, 4, 1, "", "get_default_hpo_config"], [45, 4, 1, "", "get_default_nas_config"], [45, 4, 1, "", "get_hpo_config_space"], [45, 4, 1, "", "get_hpo_search_space"], [45, 4, 1, "", "get_nas_config_space"], [45, 4, 1, "", "init"], [45, 2, 1, "", "name"], [45, 4, 1, "", "predict"], [45, 4, 1, "", "train"], [45, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.dqn.DQNMetrics": [[45, 2, 1, "", "grads"], [45, 2, 1, "", "loss"], [45, 2, 1, "", "td_error"]], 
"arlbench.core.algorithms.dqn.dqn.DQNRunnerState": [[45, 2, 1, "", "env_state"], [45, 2, 1, "", "global_step"], [45, 2, 1, "", "normalizer_state"], [45, 2, 1, "", "obs"], [45, 2, 1, "", "rng"], [45, 2, 1, "", "train_state"]], "arlbench.core.algorithms.dqn.dqn.DQNState": [[45, 2, 1, "", "buffer_state"], [45, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainState": [[45, 4, 1, "", "create_with_opt_state"], [45, 2, 1, "", "opt_state"], [45, 4, 1, "", "replace"], [45, 2, 1, "", "target_params"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult": [[45, 2, 1, "", "eval_rewards"], [45, 2, 1, "", "metrics"], [45, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn.Transition": [[45, 2, 1, "", "action"], [45, 2, 1, "", "done"], [45, 2, 1, "", "info"], [45, 2, 1, "", "obs"], [45, 2, 1, "", "reward"]], "arlbench.core.algorithms.dqn.models": [[45, 1, 1, "", "CNNQ"], [45, 1, 1, "", "MLPQ"]], "arlbench.core.algorithms.dqn.models.CNNQ": [[45, 4, 1, "", "__call__"], [45, 2, 1, "", "action_dim"], [45, 2, 1, "", "activation"], [45, 2, 1, "", "discrete"], [45, 2, 1, "", "hidden_size"], [45, 2, 1, "", "name"], [45, 2, 1, "", "parent"], [45, 2, 1, "", "scope"], [45, 4, 1, "", "setup"]], "arlbench.core.algorithms.dqn.models.MLPQ": [[45, 4, 1, "", "__call__"], [45, 2, 1, "", "action_dim"], [45, 2, 1, "", "activation"], [45, 2, 1, "", "discrete"], [45, 2, 1, "", "hidden_size"], [45, 2, 1, "", "name"], [45, 2, 1, "", "parent"], [45, 2, 1, "", "scope"], [45, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo": [[46, 1, 1, "", "PPO"], [46, 1, 1, "", "PPOMetrics"], [46, 1, 1, "", "PPORunnerState"], [46, 1, 1, "", "PPOState"], [46, 2, 1, "", "PPOTrainReturnT"], [46, 1, 1, "", "PPOTrainingResult"], [46, 0, 0, "-", "models"], [46, 0, 0, "-", "ppo"]], "arlbench.core.algorithms.ppo.PPO": [[46, 4, 1, "", "get_checkpoint_factory"], [46, 4, 1, "", "get_default_hpo_config"], [46, 4, 1, "", "get_default_nas_config"], [46, 4, 1, "", "get_hpo_config_space"], [46, 4, 1, 
"", "get_hpo_search_space"], [46, 4, 1, "", "get_nas_config_space"], [46, 4, 1, "", "init"], [46, 2, 1, "", "name"], [46, 4, 1, "", "predict"], [46, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.PPOMetrics": [[46, 2, 1, "", "advantages"], [46, 2, 1, "", "grads"], [46, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.PPORunnerState": [[46, 2, 1, "", "cur_rewards"], [46, 2, 1, "", "env_state"], [46, 2, 1, "", "global_step"], [46, 2, 1, "", "normalizer_state"], [46, 2, 1, "", "obs"], [46, 2, 1, "", "return_buffer"], [46, 2, 1, "", "return_buffer_idx"], [46, 2, 1, "", "rng"], [46, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.PPOState": [[46, 2, 1, "", "buffer_state"], [46, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.PPOTrainingResult": [[46, 2, 1, "", "eval_rewards"], [46, 2, 1, "", "metrics"], [46, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.models": [[46, 1, 1, "", "CNNActorCritic"], [46, 1, 1, "", "MLPActorCritic"]], "arlbench.core.algorithms.ppo.models.CNNActorCritic": [[46, 4, 1, "", "__call__"], [46, 2, 1, "", "action_dim"], [46, 2, 1, "", "activation"], [46, 2, 1, "", "discrete"], [46, 2, 1, "", "hidden_size"], [46, 2, 1, "", "name"], [46, 2, 1, "", "parent"], [46, 2, 1, "", "scope"], [46, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.models.MLPActorCritic": [[46, 4, 1, "", "__call__"], [46, 2, 1, "", "action_dim"], [46, 2, 1, "", "activation"], [46, 2, 1, "", "discrete"], [46, 2, 1, "", "hidden_size"], [46, 2, 1, "", "name"], [46, 2, 1, "", "parent"], [46, 2, 1, "", "scope"], [46, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.ppo": [[46, 1, 1, "", "PPO"], [46, 1, 1, "", "PPOMetrics"], [46, 1, 1, "", "PPORunnerState"], [46, 1, 1, "", "PPOState"], [46, 1, 1, "", "PPOTrainState"], [46, 1, 1, "", "PPOTrainingResult"], [46, 1, 1, "", "Transition"]], "arlbench.core.algorithms.ppo.ppo.PPO": [[46, 4, 1, "", "get_checkpoint_factory"], [46, 4, 1, "", "get_default_hpo_config"], [46, 4, 1, "", 
"get_default_nas_config"], [46, 4, 1, "", "get_hpo_config_space"], [46, 4, 1, "", "get_hpo_search_space"], [46, 4, 1, "", "get_nas_config_space"], [46, 4, 1, "", "init"], [46, 2, 1, "", "name"], [46, 4, 1, "", "predict"], [46, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.ppo.PPOMetrics": [[46, 2, 1, "", "advantages"], [46, 2, 1, "", "grads"], [46, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.ppo.PPORunnerState": [[46, 2, 1, "", "cur_rewards"], [46, 2, 1, "", "env_state"], [46, 2, 1, "", "global_step"], [46, 2, 1, "", "normalizer_state"], [46, 2, 1, "", "obs"], [46, 2, 1, "", "return_buffer"], [46, 2, 1, "", "return_buffer_idx"], [46, 2, 1, "", "rng"], [46, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.ppo.PPOState": [[46, 2, 1, "", "buffer_state"], [46, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainState": [[46, 4, 1, "", "create_with_opt_state"], [46, 2, 1, "", "opt_state"], [46, 4, 1, "", "replace"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult": [[46, 2, 1, "", "eval_rewards"], [46, 2, 1, "", "metrics"], [46, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.ppo.Transition": [[46, 2, 1, "", "action"], [46, 2, 1, "", "done"], [46, 2, 1, "", "info"], [46, 2, 1, "", "log_prob"], [46, 2, 1, "", "obs"], [46, 2, 1, "", "reward"], [46, 2, 1, "", "value"]], "arlbench.core.algorithms.prioritised_item_buffer": [[44, 5, 1, "", "create_prioritised_item_buffer"], [44, 5, 1, "", "make_prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[47, 1, 1, "", "SAC"], [47, 1, 1, "", "SACMetrics"], [47, 1, 1, "", "SACRunnerState"], [47, 1, 1, "", "SACState"], [47, 2, 1, "", "SACTrainReturnT"], [47, 1, 1, "", "SACTrainingResult"], [47, 0, 0, "-", "models"], [47, 0, 0, "-", "sac"]], "arlbench.core.algorithms.sac.SAC": [[47, 4, 1, "", "get_checkpoint_factory"], [47, 4, 1, "", "get_default_hpo_config"], [47, 4, 1, "", "get_default_nas_config"], [47, 4, 1, "", "get_hpo_config_space"], [47, 4, 1, "", 
"get_hpo_search_space"], [47, 4, 1, "", "get_nas_config_space"], [47, 4, 1, "", "init"], [47, 2, 1, "", "name"], [47, 4, 1, "", "predict"], [47, 4, 1, "", "train"], [47, 4, 1, "", "update_actor"], [47, 4, 1, "", "update_alpha"], [47, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.SACMetrics": [[47, 2, 1, "", "actor_grads"], [47, 2, 1, "", "actor_loss"], [47, 2, 1, "", "alpha_loss"], [47, 2, 1, "", "critic_grads"], [47, 2, 1, "", "critic_loss"], [47, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.SACRunnerState": [[47, 2, 1, "", "actor_train_state"], [47, 2, 1, "", "alpha_train_state"], [47, 2, 1, "", "critic_train_state"], [47, 2, 1, "", "env_state"], [47, 2, 1, "", "global_step"], [47, 2, 1, "", "normalizer_state"], [47, 2, 1, "", "obs"], [47, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.SACState": [[47, 2, 1, "", "buffer_state"], [47, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.SACTrainingResult": [[47, 2, 1, "", "eval_rewards"], [47, 2, 1, "", "metrics"], [47, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.models": [[47, 1, 1, "", "AlphaCoef"], [47, 1, 1, "", "SACCNNActor"], [47, 1, 1, "", "SACCNNCritic"], [47, 1, 1, "", "SACMLPActor"], [47, 1, 1, "", "SACMLPCritic"], [47, 1, 1, "", "SACVectorCritic"], [47, 1, 1, "", "TanhTransformedDistribution"]], "arlbench.core.algorithms.sac.models.AlphaCoef": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "alpha_init"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNActor": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "log_std_max"], [47, 2, 1, "", "log_std_min"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNCritic": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", 
"activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPActor": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "log_std_max"], [47, 2, 1, "", "log_std_min"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPCritic": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACVectorCritic": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "critic"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "n_critics"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"]], "arlbench.core.algorithms.sac.models.TanhTransformedDistribution": [[47, 4, 1, "", "mode"]], "arlbench.core.algorithms.sac.sac": [[47, 1, 1, "", "SAC"], [47, 1, 1, "", "SACMetrics"], [47, 1, 1, "", "SACRunnerState"], [47, 1, 1, "", "SACState"], [47, 1, 1, "", "SACTrainState"], [47, 1, 1, "", "SACTrainingResult"], [47, 1, 1, "", "Transition"]], "arlbench.core.algorithms.sac.sac.SAC": [[47, 4, 1, "", "get_checkpoint_factory"], [47, 4, 1, "", "get_default_hpo_config"], [47, 4, 1, "", "get_default_nas_config"], [47, 4, 1, "", "get_hpo_config_space"], [47, 4, 1, "", "get_hpo_search_space"], [47, 4, 1, "", "get_nas_config_space"], [47, 4, 1, "", "init"], [47, 2, 1, "", "name"], [47, 4, 1, "", "predict"], [47, 4, 1, "", "train"], [47, 4, 1, "", "update_actor"], [47, 4, 1, "", "update_alpha"], [47, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.sac.SACMetrics": [[47, 2, 1, "", "actor_grads"], [47, 2, 1, "", "actor_loss"], 
[47, 2, 1, "", "alpha_loss"], [47, 2, 1, "", "critic_grads"], [47, 2, 1, "", "critic_loss"], [47, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.sac.SACRunnerState": [[47, 2, 1, "", "actor_train_state"], [47, 2, 1, "", "alpha_train_state"], [47, 2, 1, "", "critic_train_state"], [47, 2, 1, "", "env_state"], [47, 2, 1, "", "global_step"], [47, 2, 1, "", "normalizer_state"], [47, 2, 1, "", "obs"], [47, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.sac.SACState": [[47, 2, 1, "", "buffer_state"], [47, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.sac.SACTrainState": [[47, 4, 1, "", "create_with_opt_state"], [47, 2, 1, "", "network_state"], [47, 4, 1, "", "replace"], [47, 2, 1, "", "target_params"]], "arlbench.core.algorithms.sac.sac.SACTrainingResult": [[47, 2, 1, "", "eval_rewards"], [47, 2, 1, "", "metrics"], [47, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.sac.Transition": [[47, 2, 1, "", "action"], [47, 2, 1, "", "done"], [47, 2, 1, "", "info"], [47, 2, 1, "", "obs"], [47, 2, 1, "", "reward"], [47, 2, 1, "", "value"]], "arlbench.core.environments": [[48, 1, 1, "", "BraxEnv"], [48, 1, 1, "", "Environment"], [48, 1, 1, "", "EnvpoolEnv"], [48, 1, 1, "", "GymnasiumEnv"], [48, 1, 1, "", "GymnaxEnv"], [48, 0, 0, "-", "autorl_env"], [48, 0, 0, "-", "brax_env"], [48, 0, 0, "-", "envpool_env"], [48, 0, 0, "-", "gymnasium_env"], [48, 0, 0, "-", "gymnax_env"], [48, 5, 1, "", "make_env"], [48, 0, 0, "-", "make_env"], [48, 0, 0, "-", "xland_env"]], "arlbench.core.environments.BraxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.Environment": [[48, 4, 1, "", "action_space"], [48, 3, 1, "", "env_name"], [48, 3, 1, "", "n_envs"], [48, 4, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_actions"], [48, 4, 1, "", "step"]], "arlbench.core.environments.EnvpoolEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", 
"observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.GymnasiumEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.GymnaxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_action"], [48, 4, 1, "", "step"]], "arlbench.core.environments.autorl_env": [[48, 1, 1, "", "Environment"]], "arlbench.core.environments.autorl_env.Environment": [[48, 4, 1, "", "action_space"], [48, 3, 1, "", "env_name"], [48, 3, 1, "", "n_envs"], [48, 4, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_actions"], [48, 4, 1, "", "step"]], "arlbench.core.environments.brax_env": [[48, 1, 1, "", "BraxEnv"]], "arlbench.core.environments.brax_env.BraxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.envpool_env": [[48, 1, 1, "", "EnvpoolEnv"], [48, 5, 1, "", "numpy_to_jax"]], "arlbench.core.environments.envpool_env.EnvpoolEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.gymnasium_env": [[48, 1, 1, "", "GymnasiumEnv"]], "arlbench.core.environments.gymnasium_env.GymnasiumEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.gymnax_env": [[48, 1, 1, "", "GymnaxEnv"]], "arlbench.core.environments.gymnax_env.GymnaxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_action"], [48, 4, 1, "", "step"]], "arlbench.core.environments.make_env": [[48, 5, 1, "", "make_env"]], "arlbench.core.environments.xland_env": [[48, 1, 1, "", "XLandEnv"]], "arlbench.core.environments.xland_env.XLandEnv": 
[[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_action"], [48, 4, 1, "", "step"]], "arlbench.core.running_statistics": [[43, 1, 1, "", "NestedMeanStd"], [43, 1, 1, "", "RunningStatisticsState"], [43, 5, 1, "", "denormalize"], [43, 5, 1, "", "init_state"], [43, 5, 1, "", "normalize"], [43, 5, 1, "", "update"]], "arlbench.core.running_statistics.NestedMeanStd": [[43, 2, 1, "", "mean"], [43, 4, 1, "", "replace"], [43, 2, 1, "", "std"]], "arlbench.core.running_statistics.RunningStatisticsState": [[43, 2, 1, "", "count"], [43, 4, 1, "", "replace"], [43, 2, 1, "", "summed_variance"]], "arlbench.core.wrappers": [[49, 1, 1, "", "FlattenObservationWrapper"], [49, 1, 1, "", "Wrapper"], [49, 0, 0, "-", "flatten_observation"], [49, 0, 0, "-", "wrapper"]], "arlbench.core.wrappers.FlattenObservationWrapper": [[49, 3, 1, "", "observation_space"], [49, 4, 1, "", "reset"], [49, 4, 1, "", "step"]], "arlbench.core.wrappers.flatten_observation": [[49, 1, 1, "", "FlattenObservationWrapper"]], "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper": [[49, 3, 1, "", "observation_space"], [49, 4, 1, "", "reset"], [49, 4, 1, "", "step"]], "arlbench.core.wrappers.wrapper": [[49, 1, 1, "", "Wrapper"]], "arlbench.utils": [[50, 0, 0, "-", "common"], [50, 5, 1, "", "config_space_to_gymnasium_space"], [50, 5, 1, "", "config_space_to_yaml"], [50, 5, 1, "", "gymnasium_space_to_gymnax_space"], [50, 5, 1, "", "recursive_concat"], [50, 5, 1, "", "save_defaults_to_yaml"], [50, 5, 1, "", "tuple_concat"]], "arlbench.utils.common": [[50, 5, 1, "", "config_space_to_gymnasium_space"], [50, 5, 1, "", "config_space_to_yaml"], [50, 5, 1, "", "gymnasium_space_to_gymnax_space"], [50, 5, 1, "", "recursive_concat"], [50, 5, 1, "", "save_defaults_to_yaml"], [50, 5, 1, "", "tuple_concat"]]}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "attribute", "Python attribute"], "3": 
["py", "property", "Python property"], "4": ["py", "method", "Python method"], "5": ["py", "function", "Python function"]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:attribute", "3": "py:property", "4": "py:method", "5": "py:function"}, "terms": {"": [5, 6, 13, 14, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 41, 44, 45, 46, 47, 52], "0": [17, 18, 20, 22, 23, 24, 25, 26, 27, 33, 35, 39, 40, 42, 43, 44, 45, 46, 47, 48, 50], "06": [35, 43], "1": [17, 18, 20, 22, 24, 25, 26, 27, 33, 42, 45, 46, 47, 48, 60], "10": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 60], "100": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "1000000": [13, 14, 17, 18, 20, 22, 24, 26, 35, 43, 44, 45, 46, 47], "1e": [35, 43], "2": [17, 18, 20, 22, 24, 25, 26, 35, 42, 43, 45, 46, 47, 60], "20": [25, 47], "24": [35, 43], "3": [17, 18, 20, 22, 24, 26, 45, 46, 47, 60], "31": [35, 43], "4": [17, 18, 20, 22, 24, 26, 45, 46, 47], "5": [17, 18, 20, 22, 24, 26, 45, 46, 47], "512": [19, 21, 25, 45, 46, 47], "6": [20, 22, 23, 24, 26, 44, 46, 47], "64": [19, 21, 25, 45, 46, 47], "64bit": [35, 43], "7": [20, 22, 24, 26, 46, 47], "8": [20, 22, 46], "A": [16, 19, 21, 25, 27, 29, 31, 32, 34, 35, 43, 44, 45, 46, 47, 48, 58], "As": [20, 22, 27, 28, 46, 48], "If": [5, 7, 8, 23, 35, 41, 42, 43, 44, 52, 60], "In": [5, 7, 8, 41, 42, 52], "It": [10, 11, 42, 57], "Not": [13, 17, 18, 24, 26, 44, 45, 47], "The": [9, 13, 14, 19, 21, 23, 25, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 57, 58, 60], "Then": 60, "There": 60, "These": [27, 28, 48], "To": [35, 43], "With": [5, 7, 8, 41, 42], "_": [13, 20, 22, 24, 26, 44, 46, 47, 48], "__call__": [10, 11, 19, 21, 25, 41, 42, 44, 45, 46, 47], "__init__": [19, 21, 25, 45, 46, 47], "__lt__": [10, 41, 42], "__new__": [10, 11, 41, 42], "__setattr__": [19, 21, 25, 45, 46, 47], "_description_": [5, 7, 8, 13, 24, 26, 27, 28, 33, 39, 40, 41, 42, 44, 47, 48, 50], "_imag": [35, 43], "_sentinel": [19, 21, 25, 45, 46, 47], 
"_type_": [39, 40, 50], "abc": [10, 11, 13, 14, 27, 28, 42, 44, 48], "abstract": [10, 11, 13, 14, 27, 28, 42, 44, 48], "access": [19, 21, 25, 45, 46, 47], "accumul": [35, 43], "acm": [35, 43], "across": [20, 22, 46], "act": [23, 44], "action": [5, 7, 8, 13, 14, 16, 17, 18, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49], "action_dim": [19, 21, 25, 44, 45, 46, 47], "action_s": [13, 14, 44], "action_spac": [5, 7, 8, 27, 28, 29, 30, 31, 32, 34, 41, 42, 43, 48, 61], "action_typ": [13, 14, 43, 44], "activ": [19, 21, 25, 44, 45, 46, 47, 60], "actor": [13, 21, 24, 25, 26, 44, 46, 47, 58], "actor_grad": [24, 26, 44, 47], "actor_loss": [13, 24, 26, 44, 47], "actor_network_param": [13, 24, 26, 44, 47], "actor_opt_st": [13, 24, 26, 44, 47], "actor_train_st": [13, 24, 26, 44, 47], "actual": [27, 28, 48, 52, 57], "ad": [23, 44], "adapt": [13, 14, 15, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "add": [23, 44], "add_batch": [23, 44], "add_sequ": [23, 44], "addit": [5, 7, 8, 41, 42], "advantag": [10, 11, 20, 22, 42, 44, 46], "after": [35, 43], "agent": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "algorithm": [5, 7, 8, 9, 27, 28, 39, 40, 41, 42, 43, 48, 50, 52, 58, 61], "algorithm_kw_arg": [9, 42], "algorithm_st": [9, 13, 14, 42, 44], "algorithmst": [9, 42], "alia": [17, 18, 20, 22, 24, 26, 45, 46, 47], "all": [9, 13, 14, 17, 18, 20, 22, 24, 26, 35, 42, 43, 44, 45, 46, 47, 52], "allow": [10, 11, 42], "alongsid": 52, "alpha": [13, 23, 24, 25, 26, 44, 47], "alpha_init": [25, 44, 47], "alpha_loss": [13, 24, 26, 44, 47], "alpha_network_param": [13, 24, 26, 44, 47], "alpha_opt_st": [13, 24, 26, 44, 47], "alpha_train_st": [13, 24, 26, 44, 47], "alphacoef": [25, 44, 47], "also": 57, "alwai": [20, 22, 46, 57], "among": [13, 14, 44], "an": [9, 10, 11, 16, 19, 21, 23, 25, 27, 28, 30, 35, 42, 43, 44, 45, 46, 47, 48, 52, 58], "ani": [9, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 33, 35, 36, 37, 42, 43, 44, 45, 46, 47, 
48, 49], "anoth": [19, 21, 25, 45, 46, 47], "append": [9, 42], "appli": [19, 21, 25, 45, 46, 47, 58], "apply_fn": [18, 22, 26, 45, 46, 47], "approxim": 58, "ar": [9, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 35, 36, 37, 42, 43, 44, 45, 46, 47, 49, 57, 60], "architectur": [13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 44, 45, 46, 47, 50], "arg": [10, 11, 25, 42, 47], "argument": [27, 33, 48], "arlbench": [52, 57, 60], "arlbenchmark": 52, "around": [10, 11, 42], "arrai": [5, 7, 8, 17, 18, 20, 22, 24, 25, 26, 27, 28, 30, 35, 41, 42, 43, 44, 45, 46, 47, 48], "aspect": 52, "assign": [19, 21, 25, 45, 46, 47], "attribut": [9, 19, 21, 25, 42, 45, 46, 47], "autom": [5, 7, 8, 41, 42, 58], "automl": [58, 60], "autorl": [5, 41, 58, 61], "autorl_config": [9, 42], "autorl_env": [41, 43, 61], "autorlenv": [5, 7, 8, 41, 42, 61], "axi": [35, 39, 40, 43, 50], "base": [5, 7, 8, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 46, 47, 48, 49], "baselines3": [21, 25, 46, 47], "basi": 52, "basic": [10, 11, 13, 14, 42, 44], "batch": [13, 15, 17, 18, 23, 24, 26, 35, 43, 44, 45, 47], "batch_siz": [15, 44], "bayesian": 58, "befor": [5, 7, 8, 19, 21, 25, 35, 41, 42, 43, 45, 46, 47], "behaviour": [10, 11, 42], "being": [19, 21, 23, 25, 44, 45, 46, 47], "best": [52, 58, 60], "between": [10, 15, 42, 44], "black": [52, 58], "blob": [21, 25, 35, 43, 46, 47], "bo": 58, "bool": [5, 7, 8, 9, 10, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 35, 41, 42, 43, 44, 45, 46, 47, 48], "bool_": [20, 22, 24, 26, 44, 46, 47, 48], "both": [27, 28, 48], "bound": [19, 21, 25, 45, 46, 47], "box": [36, 37, 49, 52, 58], "branch": 57, "brax": [27, 29, 33, 48], "brax_env": [41, 43], "braxenv": [27, 29, 43, 48], "buffer": [9, 13, 14, 17, 18, 20, 22, 23, 41, 42, 43, 45, 46], "buffer_dir": [9, 42], "buffer_st": [9, 13, 14, 17, 18, 20, 22, 24, 26, 42, 44, 45, 46, 47], "c_episod": [9, 42], "c_step": [9, 42], "calcul": [10, 11, 25, 42, 47], "call": [5, 
7, 8, 10, 11, 19, 21, 23, 25, 36, 37, 41, 42, 44, 45, 46, 47, 49], "callabl": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "can": [10, 11, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 42, 44, 45, 46, 47, 52, 57, 58, 60], "captur": [16, 44], "carbon": [10, 42], "case": [19, 21, 25, 45, 46, 47, 52], "caus": [19, 21, 25, 45, 46, 47], "caution": 57, "cd": 60, "certain": [9, 42], "cfg": [5, 6, 41], "checkpoint": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 44, 45, 46, 47, 61], "checkpoint_dir": [9, 42], "checkpoint_nam": [9, 42], "checkpoint_path": [5, 7, 8, 9, 41, 42], "chex": [13, 14, 15, 17, 18, 20, 22, 24, 26, 36, 37, 44, 45, 46, 47, 49], "choos": 52, "chosen": [23, 44], "cl": [10, 11, 42], "class": [5, 7, 8, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 46, 47, 48, 49], "classmethod": [45, 46, 47], "clear": 57, "clearli": 57, "clip": 58, "clone": 60, "cnn": [19, 21, 25, 45, 46, 47], "cnn_polici": [13, 17, 18, 20, 22, 24, 26, 27, 33, 34, 44, 45, 46, 47, 48], "cnnactorcrit": [21, 44, 46], "cnnq": [19, 44, 45], "code": [10, 42, 57], "coeffici": [25, 47], "com": [21, 25, 35, 43, 46, 47, 60], "command": 60, "common": [9, 21, 25, 41, 42, 43, 46, 47, 61], "common_gotchas_in_jax": [35, 43], "compact": [19, 21, 25, 45, 46, 47], "compar": [10, 42], "comparison": [10, 42, 57], "compat": [27, 33, 48], "comput": [35, 43], "concat": [39, 40, 50], "concaten": [39, 40, 50], "conda": 60, "config": [5, 6, 7, 8, 41, 42, 61], "config_kei": [39, 40, 50], "config_spac": [5, 7, 8, 39, 40, 41, 42, 50, 61], "config_space_to_gymnasium_spac": [39, 40, 41, 50], "config_space_to_yaml": [39, 40, 41, 50], "configspac": [5, 7, 8, 39, 40, 41, 42, 50], "configur": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 41, 42, 44, 45, 46, 47, 50, 52], "configurationspac": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 41, 42, 44, 45, 46, 47, 50], "consid": [35, 43], "consist": [17, 18, 20, 22, 24, 26, 45, 46, 47], 
"construct": [3, 19, 21, 25, 45, 46, 47], "contain": [9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 35, 42, 43, 44, 45, 46, 47, 48], "content": 61, "conv": [19, 21, 25, 45, 46, 47], "conv1": [19, 21, 25, 45, 46, 47], "converst": [39, 40, 50], "convert": [30, 39, 40, 48, 50], "core": [41, 42, 61], "correctli": 57, "correspond": [35, 43], "count": [35, 41, 43], "cpu": [23, 44], "creat": [5, 7, 8, 10, 11, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 41, 42, 44, 45, 46, 47, 48, 60], "create_prioritised_item_buff": [23, 43, 44], "create_with_opt_st": [44, 45, 46, 47], "critic": [13, 21, 24, 25, 26, 44, 46, 47, 58], "critic_grad": [24, 26, 44, 47], "critic_loss": [13, 24, 26, 44, 47], "critic_network_param": [13, 24, 26, 44, 47], "critic_opt_st": [13, 24, 26, 44, 47], "critic_target_param": [13, 24, 26, 44, 47], "critic_train_st": [13, 24, 26, 44, 47], "cumul": [13, 14, 44], "cur_reward": [20, 22, 44, 46], "current": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 52], "d": [16, 44], "data": [9, 23, 35, 42, 43, 44], "decid": 52, "deep": [13, 17, 18, 44, 45, 58], "deepmind": [35, 43], "def": [19, 21, 25, 45, 46, 47], "default": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 35, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50], "defin": [13, 14, 19, 21, 25, 44, 45, 46, 47, 52, 57], "degrad": [35, 43], "denorm": [35, 41, 43], "depend": [23, 35, 43, 44], "determinist": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "deterministic_ev": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "deviat": [10, 35, 42, 43, 52], "devic": [23, 44], "dict": [5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 27, 33, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50], "dict1": [39, 40, 50], "dict2": [39, 40, 50], "dictionari": [9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 42, 44, 45, 46, 47, 50], "differ": [13, 14, 44, 52, 57, 58], "dimens": [35, 43], "directli": [10, 11, 42], "directori": [9, 42], "discret": [13, 14, 19, 21, 44, 45, 46], "discuss": 
52, "disk": [9, 42], "distrax": [25, 47], "distribut": [25, 47], "dlr": [21, 25, 46, 47], "do": [10, 11, 42, 57], "doc": [35, 43], "document": 52, "doe": [19, 20, 21, 22, 25, 45, 46, 47], "doesn": [35, 43], "dolor": 59, "done": [9, 10, 11, 13, 16, 17, 18, 22, 26, 42, 43, 44, 45, 46, 47, 58, 60], "doubl": [35, 43], "download": 60, "dqn": [13, 24, 26, 41, 42, 43, 44, 47, 52, 58], "dqnmetric": [17, 18, 44, 45], "dqnrunnerst": [13, 17, 18, 44, 45], "dqnstate": [13, 17, 18, 44, 45], "dqntrainingresult": [13, 17, 18, 44, 45], "dqntrainreturnt": [13, 17, 18, 44, 45], "dqntrainstat": [13, 17, 18, 44, 45], "dtype": [35, 43], "dummi": [9, 42], "dummy_buffer_st": [9, 42], "dure": [5, 7, 8, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "dynam": [35, 43], "each": [5, 7, 8, 23, 27, 28, 41, 42, 44, 48], "earlier": [35, 43], "either": [19, 21, 25, 45, 46, 47, 60], "element": [35, 39, 40, 43, 50], "emiss": [10, 41, 42], "empti": [5, 7, 8, 41, 42], "en": [35, 43], "enabl": [35, 43, 57], "entropi": [13, 24, 26, 44, 47, 58], "env": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 38, 41, 42, 44, 45, 46, 47, 48, 49], "env_framework": [27, 33, 48], "env_kwarg": [27, 29, 30, 31, 32, 33, 34, 48], "env_nam": [27, 28, 29, 30, 31, 32, 33, 34, 43, 48], "env_stat": [17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49], "environ": [5, 7, 8, 9, 10, 11, 13, 14, 16, 36, 37, 41, 42, 43, 44, 49, 52, 57, 58, 60], "envpool": [27, 30, 33, 48, 60], "envpool_env": [41, 43], "envpoolenv": [27, 30, 43, 48], "episod": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "equival": [23, 27, 33, 35, 43, 44, 48], "error": [5, 7, 8, 41, 42], "etc": [27, 33, 35, 43, 48], "eval": [5, 7, 8, 13, 14, 41, 42, 43, 44, 61], "eval_env": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "eval_reward": [17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "evalu": [5, 7, 8, 10, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 52], "evalut": [5, 7, 8, 41, 42], "even": [35, 
43], "exisit": 57, "experi": [13, 15, 24, 26, 44, 47, 52, 57], "exploit": 58, "explor": 58, "expon": [23, 44], "extract": [39, 40, 50], "facilit": 57, "factori": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "fals": [13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 34, 44, 45, 46, 47, 48], "featur": [5, 7, 8, 11, 41, 42], "fidel": 58, "field": [17, 18, 20, 22, 24, 26, 35, 43, 45, 46, 47], "file": [35, 39, 40, 43, 50], "final": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "find": [57, 58], "first": [10, 11, 39, 40, 42, 50, 60], "fit": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "flatten": [36, 37, 49], "flatten_observ": [41, 43], "flattenobservationwrapp": [36, 37, 43, 49], "flax": [19, 21, 25, 45, 46, 47], "float": [5, 6, 23, 35, 41, 43, 44, 47], "float32": [35, 43], "focus": 52, "follow": [19, 21, 25, 27, 28, 33, 45, 46, 47, 48, 60], "found": [52, 57], "framework": [27, 33, 48, 57], "free": 57, "from": [9, 35, 42, 43, 52, 58, 60], "from_tupl": [43, 44], "frozendict": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "full": [35, 43], "fulli": [27, 28, 48], "function": [6, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 35, 36, 37, 40, 42, 43, 44, 45, 46, 47, 48, 49, 58], "gener": [13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49], "get_checkpoint_factori": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_default_hpo_config": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_default_nas_config": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_hpo_config_spac": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_hpo_search_spac": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_nas_config_spac": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_spec": [10, 41, 42], "get_state_spac": [11, 41, 42], "git": 60, "github": [21, 25, 35, 43, 46, 47, 60], "give": [19, 21, 25, 45, 46, 47], "given": [5, 6, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 35, 36, 
37, 41, 43, 44, 45, 46, 47, 48, 49, 58], "global_step": [17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "good": 52, "gpu": [23, 44], "grad": [11, 13, 17, 18, 20, 22, 42, 44, 45, 46], "grad_info": 42, "gradient": [11, 42, 58], "gradinfo": [11, 41, 42], "gymnasium": [5, 7, 8, 27, 28, 31, 33, 39, 40, 41, 42, 48, 50, 57], "gymnasium_env": [41, 43], "gymnasium_space_to_gymnax_spac": [39, 40, 41, 50], "gymnasiumenv": [27, 31, 43, 48], "gymnax": [27, 28, 29, 30, 31, 32, 33, 34, 39, 40, 48, 50], "gymnax_env": [41, 43], "gymnax_spac": [39, 40, 50], "gymnaxenv": [27, 32, 43, 48], "gynasium": [5, 7, 8, 41, 42], "gynmasium": [5, 7, 8, 41, 42], "ha": [27, 33, 48], "happen": [19, 21, 25, 45, 46, 47], "have": [35, 43, 57], "here": [19, 21, 25, 45, 46, 47], "hidden_s": [19, 21, 25, 44, 45, 46, 47], "hierarchi": [35, 43], "how": 52, "howev": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 52, 57], "hp_config": [9, 39, 40, 42, 50], "hp_config_spac": [39, 40, 50], "hpo": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 52, 58], "hpo_config": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 61], "html": [35, 43], "http": [21, 25, 35, 43, 46, 47], "hyperparamet": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 41, 42, 44, 45, 46, 47, 50, 52, 58], "i": [3, 5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 41, 42, 44, 45, 46, 47, 52, 57, 60], "id": [9, 27, 28, 33, 42, 48], "ideal": 57, "identifi": [9, 42], "imit": [10, 11, 42], "immedi": [19, 21, 25, 45, 46, 47], "impact": [35, 43], "implement": [10, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 42, 44, 45, 46, 47, 48], "import": 52, "improv": [35, 43, 58], "includ": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "independ": [23, 44], "inexact": [35, 43], "info": [18, 22, 26, 44, 45, 46, 47], "inform": [5, 7, 8, 11, 41, 42], "infot": [5, 7, 8, 41, 42], "init": [13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 43, 44, 45, 46, 47], "init_and_output": [19, 21, 25, 45, 46, 47], "init_st": [35, 41, 43], "initi": [5, 
7, 8, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 35, 41, 42, 43, 44, 45, 46, 47], "insid": [19, 21, 25, 45, 46, 47], "instanc": [10, 11, 19, 21, 25, 42, 45, 46, 47], "instead": 60, "int": [5, 7, 8, 9, 13, 14, 15, 17, 18, 20, 22, 23, 24, 26, 27, 28, 33, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50], "int32": [35, 43], "integ": [35, 43], "interact": [16, 44], "intern": [27, 28, 36, 37, 48, 49], "interv": [15, 44], "invok": [19, 21, 25, 45, 46, 47], "io": [35, 43], "ipsum": 59, "is_weight": [13, 17, 18, 24, 26, 44, 45, 47], "item": [16, 23, 43, 44], "iter": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "its": [5, 7, 8, 36, 37, 41, 42, 49, 58], "jax": [13, 17, 18, 20, 22, 24, 26, 27, 28, 30, 33, 35, 43, 44, 45, 46, 47, 48], "jax_enable_x64": [35, 43], "jit": [35, 43, 57], "jittabl": [27, 28, 48], "jnp": [13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 35, 36, 37, 43, 44, 45, 46, 47, 48, 49], "json": 42, "just": 60, "keep": [10, 11, 42], "kei": [13, 14, 15, 16, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "kept": [20, 22, 46], "keyword": [27, 33, 48], "kind": [27, 28, 48], "know": [9, 42], "kwarg": [10, 11, 25, 42, 44, 45, 46, 47], "l48": [21, 25, 46, 47], "larg": [35, 43], "last": [9, 10, 42], "last_ob": [16, 43, 44], "latest": [35, 43, 60], "lazi": [19, 21, 25, 45, 46, 47], "lazili": [19, 21, 25, 45, 46, 47], "learn": [5, 7, 8, 13, 14, 41, 42, 44, 58], "leav": [35, 43], "length": [15, 23, 44], "less": [10, 42], "level": [5, 41, 58], "like": [5, 7, 8, 16, 19, 21, 25, 41, 42, 44, 45, 46, 47, 60], "line": [19, 21, 25, 45, 46, 47], "linen": [19, 21, 25, 45, 46, 47], "linux": 60, "list": [5, 6, 7, 8, 41, 42], "load": [9, 41, 42], "load_buff": [9, 41, 42], "log_prob": [22, 44, 46], "log_std_max": [25, 44, 47], "log_std_min": [25, 44, 47], "logger": [5, 6, 41], "lorem": 59, "loss": [13, 17, 18, 20, 22, 44, 45, 46], "machin": 58, "make": [23, 44, 60], "make_env": [27, 41, 43], "make_prioritised_item_buff": [23, 43, 44], 
"mani": 57, "map": [16, 44], "master": [21, 25, 35, 43, 46, 47], "match": [27, 33, 35, 43, 48], "max_abs_valu": [35, 43], "max_length": [23, 44], "max_recorded_prior": 42, "maxim": [10, 42], "maximum": [23, 35, 43, 44, 58], "mean": [10, 35, 41, 42, 43], "mean_std": [35, 43], "measur": [10, 42], "method": [9, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 42, 44, 45, 46, 47, 48, 58], "metric": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "min_length": [23, 44], "minim": [10, 42], "minimum": [23, 35, 43, 44, 58], "mlp": [19, 21, 25, 45, 46, 47], "mlpactorcrit": [21, 44, 46], "mlpq": [19, 44, 45], "mode": [25, 44, 47], "model": [43, 44, 58], "modifi": [35, 43], "modul": [5, 7, 12, 13, 17, 19, 20, 21, 24, 25, 27, 36, 39, 61], "more": [23, 44, 52], "most": 52, "mrp_file": [41, 42], "multi": 58, "multipl": 58, "must": [27, 33, 35, 43, 48], "mymodul": [19, 21, 25, 45, 46, 47], "n": 60, "n_critic": [25, 44, 47], "n_env": [13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 29, 30, 32, 33, 34, 43, 44, 45, 46, 47, 48], "n_eval_episod": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "n_eval_step": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "n_total_timestep": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "name": [9, 19, 21, 25, 27, 28, 33, 35, 39, 40, 42, 43, 44, 45, 46, 47, 48, 50], "namedtupl": [17, 18, 20, 22, 24, 26, 45, 46, 47], "nas_config": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "nas_config_sapc": [39, 40, 50], "naturecnn": [21, 25, 46, 47], "ndarrai": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 35, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49], "need": [27, 28, 48], "nest": [35, 43], "nestedmeanstd": [35, 41, 43], "network": [13, 17, 18, 19, 20, 21, 22, 24, 25, 26, 44, 45, 46, 47, 58], "network_param": [13, 17, 18, 20, 22, 44, 45, 46], "network_st": [44, 47], "neural": [13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 44, 45, 46, 47, 50, 58], "new": [10, 11, 18, 22, 26, 35, 42, 43, 45, 46, 47], "next": 
[13, 17, 18, 44, 45], "next_observ": [13, 17, 18, 44, 45], "nn": [19, 21, 25, 45, 46, 47], "node": 42, "nodes_fil": [41, 42], "none": [5, 6, 7, 8, 9, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50], "norm": [11, 42], "normal": [35, 41, 43], "normalizer_st": [17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "note": [20, 22, 27, 28, 35, 43, 46, 48], "notebook": [35, 43], "now": [19, 21, 25, 45, 46, 47], "np": [5, 7, 8, 41, 42], "npy": 42, "num_eval_episod": [5, 7, 8, 13, 14, 41, 42, 44], "number": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 33, 36, 37, 41, 42, 44, 45, 46, 47, 48, 49], "numpi": [30, 35, 43, 48], "numpy_to_jax": [30, 43, 48], "ob": [13, 14, 16, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "object": [5, 6, 7, 8, 9, 11, 16, 18, 19, 21, 22, 25, 26, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 49, 50, 52, 58, 61], "objectivest": [5, 7, 8, 41, 42], "objectv": [10, 42], "obser": [36, 37, 49], "observ": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 44, 45, 46, 47, 48, 49], "observation_spac": [5, 7, 8, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 43, 48, 49, 61], "observationt": [5, 7, 8, 41, 42], "off": 58, "onc": [19, 21, 25, 45, 46, 47], "one": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 33, 41, 42, 44, 45, 46, 47, 48, 52, 60], "ones": 57, "onli": [20, 22, 35, 43, 46], "oper": [23, 44], "opt_stat": [13, 17, 18, 20, 22, 26, 44, 45, 46, 47], "optax": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "optim": [10, 13, 17, 18, 20, 22, 23, 24, 26, 42, 44, 45, 46, 47, 52, 58], "optimize_object": [10, 42], "option": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50], "optstat": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "org": [35, 43], "other": [10, 13, 17, 18, 19, 20, 21, 22, 24, 25, 26, 42, 44, 45, 46, 47], "overflow": [35, 43], "overrid": [10, 11, 42], "overriden": [9, 42], "own": [52, 57], 
"packag": [5, 60, 61], "page": 3, "paper": [23, 44, 57], "param": [13, 17, 18, 20, 22, 26, 44, 45, 46, 47], "paramet": [5, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 20, 22, 23, 24, 26, 27, 28, 33, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "parent": [19, 21, 25, 44, 45, 46, 47], "part": [9, 42], "pass": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 33, 35, 41, 42, 43, 44, 45, 46, 47, 48], "path": [5, 7, 8, 9, 41, 42], "per": [5, 7, 8, 13, 14, 17, 18, 20, 22, 23, 24, 26, 41, 42, 44, 45, 46, 47], "perform": [5, 7, 8, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 28, 35, 41, 42, 43, 44, 45, 46, 47, 48], "period": [15, 44], "pip": 60, "pleas": 52, "pmap": [35, 43], "pmap_axis_nam": [35, 43], "png": [35, 43], "point": [35, 43], "polici": [13, 20, 22, 44, 46, 58], "possibl": [13, 14, 44], "possibli": [35, 43], "posssibl": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "ppo": [13, 24, 25, 26, 41, 42, 43, 44, 47, 52, 58], "ppometr": [20, 22, 44, 46], "pporunnerst": [13, 20, 22, 44, 46], "ppostat": [13, 20, 22, 44, 46], "ppotrainingresult": [13, 20, 22, 44, 46], "ppotrainreturnt": [13, 20, 22, 44, 46], "ppotrainst": [20, 22, 44, 46], "pre": 52, "precis": [35, 43], "predefin": 58, "predict": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "principl": 58, "prioriti": [9, 23, 42, 44], "prioritis": [23, 44], "prioritised_item_buff": [41, 43], "prioritisedtrajectorybuff": [23, 44], "prioritisedtrajectorybufferst": [9, 13, 15, 17, 18, 24, 26, 42, 44, 45, 47], "priority_expon": [23, 44], "priority_state_path": [9, 42], "prioriz": [15, 44], "prngkei": [13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49], "problem": 58, "proce": 57, "process": 58, "promin": 52, "properti": [5, 7, 8, 13, 14, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 44, 48, 49], "propos": 52, "provid": [16, 44, 52, 57], "proxim": [13, 20, 22, 44, 46, 58], "py": [21, 25, 35, 43, 46, 47], "pypi": 60, "python": 60, "q": [13, 17, 18, 19, 44, 45, 58], "question": 52, "rais": [5, 
7, 8, 41, 42], "random": [5, 7, 8, 13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 33, 36, 37, 41, 42, 44, 45, 46, 47, 48, 49, 58], "randomli": 58, "rang": [35, 43], "rank": [10, 41, 42], "re": [5, 7, 8, 41, 42, 57], "readthedoc": [35, 43], "real": 58, "reason": 52, "recurs": [39, 40, 50], "recursive_concat": [39, 40, 41, 50], "reinforc": [5, 7, 8, 13, 14, 41, 42, 44, 58], "relat": [9, 42], "replac": [18, 22, 26, 35, 41, 43, 44, 45, 46, 47], "repo": 57, "report": [52, 57], "repositori": 60, "requir": [9, 42], "reset": [5, 7, 8, 27, 28, 36, 37, 41, 42, 43, 48, 49, 61], "restor": [9, 42], "result": [9, 13, 14, 17, 18, 20, 22, 24, 26, 35, 36, 37, 42, 43, 44, 45, 46, 47, 49, 52, 57], "return": [5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "return_buff": [20, 22, 44, 46], "return_buffer_idx": [20, 22, 44, 46], "reward": [10, 13, 14, 16, 17, 18, 22, 26, 42, 43, 44, 45, 46, 47], "reward_mean": 42, "reward_std": 42, "rewardmean": [10, 41, 42], "rewardstd": [10, 41, 42], "rl": [5, 7, 8, 27, 28, 29, 30, 31, 32, 33, 34, 41, 42, 48, 52], "rm": [21, 25, 46, 47], "rng": [13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49], "rng_kei": [15, 44], "run": [5, 6, 7, 8, 35, 41, 42, 43, 52, 60], "run_arlbench": [5, 6, 41, 61], "runner": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "runner_st": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "running_statist": [41, 61], "runningstatisticsst": [17, 18, 20, 22, 24, 26, 35, 41, 43, 45, 46, 47], "runtim": [10, 41, 42], "sac": [13, 41, 42, 43, 44, 52, 58], "saccnnactor": [25, 44, 47], "saccnncrit": [25, 44, 47], "sacmetr": [24, 26, 44, 47], "sacmlpactor": [25, 44, 47], "sacmlpcrit": [25, 44, 47], "sacrunnerst": [13, 24, 26, 44, 47], "sacstat": [13, 24, 26, 44, 47], "sactrainingresult": [13, 24, 26, 44, 47], "sactrainreturnt": [13, 24, 26, 44, 47], "sactrainst": [13, 24, 26, 44, 47], "sacvectorcrit": [25, 
44, 47], "safe": [19, 21, 25, 45, 46, 47], "same": [35, 39, 40, 43, 50], "sampl": [13, 14, 15, 17, 18, 20, 22, 23, 24, 26, 27, 28, 44, 45, 46, 47, 48, 58], "sample_act": [27, 28, 43, 48], "sample_batch_s": [23, 44], "save": [9, 41, 42], "save_buff": [9, 41, 42], "save_defaults_to_yaml": [39, 40, 41, 50], "scalar": 42, "scalars_fil": [41, 42], "scope": [44, 45, 46, 47], "search": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 52, 57, 58], "second": [39, 40, 50, 60], "section": 52, "see": [19, 21, 25, 35, 43, 45, 46, 47], "seed": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 30, 31, 33, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50, 52], "select": 52, "self": [10, 11, 19, 21, 25, 42, 45, 46, 47], "sequenc": [15, 23, 44], "sequence_length": [15, 44], "set": [16, 35, 43, 44], "setup": [19, 21, 25, 44, 45, 46, 47], "sever": 52, "shape": [13, 14, 35, 43, 44], "share": [13, 14, 44], "should": [35, 43, 57], "similar": [19, 21, 25, 45, 46, 47], "simplest": [52, 60], "simplifi": [35, 43], "sinc": 52, "singl": [9, 23, 42, 44], "size": [9, 13, 14, 15, 23, 42, 44], "so": 57, "soft": [13, 24, 26, 44, 47, 58], "sort": [10, 42], "sourc": [5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "space": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 52, 57, 58], "specif": [10, 11, 42], "specifi": [18, 22, 26, 35, 43, 45, 46, 47], "stabil": 58, "stabl": [21, 25, 35, 43, 46, 47], "stable_baselines3": [21, 25, 46, 47], "standard": [10, 35, 42, 43], "state": [5, 7, 8, 9, 11, 13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 35, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 57], "state_featur": [41, 61], "statefeatur": [11, 41, 42], "static": [9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 42, 44, 45, 46, 47], "statist": [35, 43], "std": [35, 41, 43], "std_max_valu": [35, 43], "std_min_valu": [35, 43], 
"step": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 61], "store": [9, 10, 11, 42], "str": [5, 7, 8, 9, 10, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 28, 33, 35, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50], "string": [39, 40, 50], "structur": [35, 43, 52], "sub": [27, 28, 48], "submodul": [19, 21, 25, 61], "subpackag": 61, "subpag": 52, "subsequ": [10, 11, 42], "subset": 52, "summed_vari": [35, 41, 43], "support": [15, 27, 28, 44, 48, 52], "surrog": 58, "system": 60, "t": [35, 43], "tag": [9, 42], "take": [27, 28, 36, 37, 48, 49], "taken": [35, 43], "tanh": [19, 21, 25, 45, 46, 47], "tanhtransformeddistribut": [25, 44, 47], "target": [13, 17, 18, 24, 26, 44, 45, 47, 52], "target_param": [13, 17, 18, 26, 44, 45, 47], "td_error": [13, 17, 18, 24, 26, 44, 45, 47], "termin": [5, 7, 8, 41, 42], "test": 52, "than": [10, 42, 57], "thi": [3, 5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 35, 41, 42, 43, 44, 45, 46, 47, 52, 57, 58, 60], "three": [19, 21, 25, 45, 46, 47, 52], "time": [23, 44], "timestep": [13, 14, 16, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "to_tupl": [43, 44], "top": [5, 41], "torch_lay": [21, 25, 46, 47], "total": [5, 7, 8, 10, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "tpu": [23, 44], "track_metr": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "track_trajectori": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "train": [5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 43, 44, 45, 46, 47], "train_func": [10, 11, 42], "train_result": [9, 13, 14, 17, 18, 20, 22, 24, 26, 42, 44, 45, 46, 47], "train_stat": [13, 17, 18, 20, 22, 44, 45, 46], "trainfunc": [10, 11, 42], "training_result": [13, 14, 44], "trainingi": [13, 24, 26, 44, 47], "trainresult": [9, 42], "trainstat": [18, 22, 26, 45, 46, 47], "trajectori": [13, 15, 17, 18, 20, 22, 23, 24, 26, 44, 45, 46, 47], "trajectorybufferst": [9, 42], "transform": [25, 47], "transit": [13, 17, 18, 20, 22, 23, 24, 26, 
44, 45, 46, 47], "transitionsampl": [15, 44], "true": [13, 14, 17, 18, 19, 20, 21, 22, 24, 26, 35, 43, 44, 45, 46, 47], "truncat": [5, 7, 8, 41, 42], "tupl": [5, 6, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50], "tuple1": [39, 40, 50], "tuple2": [39, 40, 50], "tuple_concat": [39, 40, 41, 50], "twice": [35, 43], "two": [10, 39, 40, 42, 50, 60], "tx": [18, 22, 26, 45, 46, 47], "type": [5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "u": [10, 11, 42], "under": 3, "uniform": [15, 44], "uniform_sampl": [15, 43, 44], "union": [20, 22, 24, 26, 44, 45, 46, 47, 48], "uniqu": [9, 42], "unus": [13, 20, 22, 24, 26, 44, 46, 47], "updat": [13, 14, 17, 18, 20, 22, 24, 26, 35, 41, 43, 44, 45, 46, 47], "update_actor": [13, 24, 26, 43, 44, 47], "update_alpha": [13, 24, 26, 43, 44, 47], "update_crit": [13, 24, 26, 43, 44, 47], "update_hpo_config": [13, 14, 43, 44], "us": [5, 6, 7, 8, 10, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 35, 41, 42, 43, 44, 45, 46, 47, 48, 52, 57, 58, 60], "usecas": 52, "util": [35, 41, 43, 61], "valid": [35, 43], "validate_shap": [35, 43], "valu": [13, 16, 18, 22, 24, 26, 35, 39, 40, 43, 44, 45, 46, 47, 50], "valueerror": [5, 7, 8, 41, 42], "varianc": [35, 43], "varieti": 52, "variou": [27, 28, 48], "vault": [9, 42], "vault_uuid": [9, 42], "version": 60, "view": [16, 44], "virtual": 60, "wa": [5, 7, 8, 9, 35, 41, 42, 43], "wai": 60, "want": [52, 60], "we": [10, 11, 42, 52, 57], "weigh": 58, "weight": [13, 24, 26, 35, 43, 44, 47], "well": [9, 27, 28, 42, 48], "when": [19, 21, 25, 35, 43, 45, 46, 47, 57], "where": [9, 42, 57], "whether": [9, 10, 13, 14, 23, 24, 26, 42, 44, 47], "which": [9, 19, 21, 25, 42, 45, 46, 47, 52, 57], "while": [10, 11, 42, 60], "wise": [39, 40, 50], "work": [19, 21, 25, 45, 46, 47, 57], "workflow": 52, "world": 58, "would": [57, 60], "wrap": [10, 11, 19, 21, 25, 36, 
37, 42, 45, 46, 47, 49, 57], "wrapper": [27, 33, 41, 43, 48], "write": [39, 40, 50], "x": [19, 21, 25, 30, 45, 46, 47, 48], "xland": [27, 33, 34, 48], "xland_env": [41, 43], "xlandenv": [34, 43, 48], "yaml": [39, 40, 50], "ye": 57, "yet": [19, 21, 25, 45, 46, 47], "you": [52, 57, 60], "your": [52, 57]}, "titles": ["Using the ARLBench States", "ARLBench and Different AutoRL Paradigms", "Dynamic Configuration in ARLBench", "Advanced Configuration Options", "API References", "arlbench", "arlbench.arlbench", "arlbench.autorl", "arlbench.autorl.autorl_env", "arlbench.autorl.checkpointing", "arlbench.autorl.objectives", "arlbench.autorl.state_features", "arlbench.core", "arlbench.core.algorithms", "arlbench.core.algorithms.algorithm", "arlbench.core.algorithms.buffers", "arlbench.core.algorithms.common", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.dqn.dqn", "arlbench.core.algorithms.dqn.models", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.ppo.models", "arlbench.core.algorithms.ppo.ppo", "arlbench.core.algorithms.prioritised_item_buffer", "arlbench.core.algorithms.sac", "arlbench.core.algorithms.sac.models", "arlbench.core.algorithms.sac.sac", "arlbench.core.environments", "arlbench.core.environments.autorl_env", "arlbench.core.environments.brax_env", "arlbench.core.environments.envpool_env", "arlbench.core.environments.gymnasium_env", "arlbench.core.environments.gymnax_env", "arlbench.core.environments.make_env", "arlbench.core.environments.xland_env", "arlbench.core.running_statistics", "arlbench.core.wrappers", "arlbench.core.wrappers.flatten_observation", "arlbench.core.wrappers.wrapper", "arlbench.utils", "arlbench.utils.common", "arlbench package", "arlbench.autorl package", "arlbench.core package", "arlbench.core.algorithms package", "arlbench.core.algorithms.dqn package", "arlbench.core.algorithms.ppo package", "arlbench.core.algorithms.sac package", "arlbench.core.environments package", "arlbench.core.wrappers package", "arlbench.utils 
package", "The ARLBench Subsets", "Benchmarking AutoRL Methods", "Objectives in ARLBench", "ARLBench Options", "Considerations for Seeding", "&lt;no title&gt;", "Frequently Asked Questions", "Glossary", "Home", "Installation", "arlbench"], "titleterms": {"The": 51, "advanc": 3, "algorithm": [13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 44, 45, 46, 47], "api": 4, "arlbench": [0, 1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 61], "ask": 57, "autorl": [1, 7, 8, 9, 10, 11, 42, 52], "autorl_env": [8, 28, 42, 48], "benchmark": 52, "brax_env": [29, 48], "buffer": [15, 44], "checkpoint": [9, 42], "common": [16, 40, 44, 50], "configur": [2, 3], "consider": 55, "content": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "core": [12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 43, 44, 45, 46, 47, 48, 49], "differ": 1, "dqn": [17, 18, 19, 45], "dynam": 2, "environ": [27, 28, 29, 30, 31, 32, 33, 34, 48], "envpool_env": [30, 48], "flatten_observ": [37, 49], "frequent": 57, "glossari": 58, "gymnasium_env": [31, 48], "gymnax_env": [32, 48], "home": 59, "instal": 60, "make_env": [33, 48], "method": 52, "model": [19, 21, 25, 45, 46, 47], "modul": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "object": [10, 42, 53], "option": [3, 54], "packag": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "paradigm": 1, "ppo": [20, 21, 22, 46], "prioritised_item_buff": [23, 44], "question": 57, "refer": 4, "running_statist": [35, 43], "sac": [24, 25, 26, 47], "seed": 55, "state": 0, "state_featur": [11, 42], "submodul": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "subpackag": [41, 43, 44], "subset": 51, "us": 0, "util": [39, 40, 50], "wrapper": [36, 37, 38, 49], "xland_env": [34, 48]}})
\ No newline at end of file
+Search.setIndex({"alltitles": {"API References": [[4, "api-references"]], "ARLBench Options": [[54, "arlbench-options"]], "ARLBench and Different AutoRL Paradigms": [[1, "arlbench-and-different-autorl-paradigms"]], "Advanced Configuration Options": [[3, "advanced-configuration-options"]], "Benchmarking AutoRL Methods": [[52, "benchmarking-autorl-methods"]], "Considerations for Seeding": [[55, "considerations-for-seeding"]], "Dynamic Configuration in ARLBench": [[2, "dynamic-configuration-in-arlbench"]], "Frequently Asked Questions": [[57, "frequently-asked-questions"]], "Glossary": [[58, "glossary"]], "Home": [[59, "home"]], "Installation": [[60, "installation"]], "Module contents": [[41, "module-arlbench"], [42, "module-arlbench.autorl"], [43, "module-arlbench.core"], [44, "module-arlbench.core.algorithms"], [45, "module-arlbench.core.algorithms.dqn"], [46, "module-arlbench.core.algorithms.ppo"], [47, "module-arlbench.core.algorithms.sac"], [48, "module-arlbench.core.environments"], [49, "module-arlbench.core.wrappers"], [50, "module-arlbench.utils"]], "Objectives in ARLBench": [[53, "objectives-in-arlbench"]], "Submodules": [[41, "submodules"], [42, "submodules"], [43, "submodules"], [44, "submodules"], [45, "submodules"], [46, "submodules"], [47, "submodules"], [48, "submodules"], [49, "submodules"], [50, "submodules"]], "Subpackages": [[41, "subpackages"], [43, "subpackages"], [44, "subpackages"]], "The ARLBench Subsets": [[51, "the-arlbench-subsets"]], "Using the ARLBench States": [[0, "using-the-arlbench-states"]], "arlbench": [[5, "module-arlbench"], [61, "arlbench"]], "arlbench package": [[41, "arlbench-package"]], "arlbench.arlbench": [[6, "module-arlbench.arlbench"]], "arlbench.arlbench module": [[41, "module-arlbench.arlbench"]], "arlbench.autorl": [[7, "module-arlbench.autorl"]], "arlbench.autorl package": [[42, "arlbench-autorl-package"]], "arlbench.autorl.autorl_env": [[8, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.autorl_env module": 
[[42, "module-arlbench.autorl.autorl_env"]], "arlbench.autorl.checkpointing": [[9, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.checkpointing module": [[42, "module-arlbench.autorl.checkpointing"]], "arlbench.autorl.objectives": [[10, "module-arlbench.autorl.objectives"]], "arlbench.autorl.objectives module": [[42, "module-arlbench.autorl.objectives"]], "arlbench.autorl.state_features": [[11, "module-arlbench.autorl.state_features"]], "arlbench.autorl.state_features module": [[42, "module-arlbench.autorl.state_features"]], "arlbench.core": [[12, "module-arlbench.core"]], "arlbench.core package": [[43, "arlbench-core-package"]], "arlbench.core.algorithms": [[13, "module-arlbench.core.algorithms"]], "arlbench.core.algorithms package": [[44, "arlbench-core-algorithms-package"]], "arlbench.core.algorithms.algorithm": [[14, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.algorithm module": [[44, "module-arlbench.core.algorithms.algorithm"]], "arlbench.core.algorithms.buffers": [[15, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.buffers module": [[44, "module-arlbench.core.algorithms.buffers"]], "arlbench.core.algorithms.common": [[16, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.common module": [[44, "module-arlbench.core.algorithms.common"]], "arlbench.core.algorithms.dqn": [[17, "module-arlbench.core.algorithms.dqn"]], "arlbench.core.algorithms.dqn package": [[45, "arlbench-core-algorithms-dqn-package"]], "arlbench.core.algorithms.dqn.dqn": [[18, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.dqn module": [[45, "module-arlbench.core.algorithms.dqn.dqn"]], "arlbench.core.algorithms.dqn.models": [[19, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.dqn.models module": [[45, "module-arlbench.core.algorithms.dqn.models"]], "arlbench.core.algorithms.ppo": [[20, "module-arlbench.core.algorithms.ppo"]], "arlbench.core.algorithms.ppo 
package": [[46, "arlbench-core-algorithms-ppo-package"]], "arlbench.core.algorithms.ppo.models": [[21, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.models module": [[46, "module-arlbench.core.algorithms.ppo.models"]], "arlbench.core.algorithms.ppo.ppo": [[22, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.ppo.ppo module": [[46, "module-arlbench.core.algorithms.ppo.ppo"]], "arlbench.core.algorithms.prioritised_item_buffer": [[23, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.prioritised_item_buffer module": [[44, "module-arlbench.core.algorithms.prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[24, "module-arlbench.core.algorithms.sac"]], "arlbench.core.algorithms.sac package": [[47, "arlbench-core-algorithms-sac-package"]], "arlbench.core.algorithms.sac.models": [[25, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.models module": [[47, "module-arlbench.core.algorithms.sac.models"]], "arlbench.core.algorithms.sac.sac": [[26, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.algorithms.sac.sac module": [[47, "module-arlbench.core.algorithms.sac.sac"]], "arlbench.core.environments": [[27, "module-arlbench.core.environments"]], "arlbench.core.environments package": [[48, "arlbench-core-environments-package"]], "arlbench.core.environments.autorl_env": [[28, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.autorl_env module": [[48, "module-arlbench.core.environments.autorl_env"]], "arlbench.core.environments.brax_env": [[29, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.brax_env module": [[48, "module-arlbench.core.environments.brax_env"]], "arlbench.core.environments.envpool_env": [[30, "module-arlbench.core.environments.envpool_env"]], "arlbench.core.environments.envpool_env module": [[48, "module-arlbench.core.environments.envpool_env"]], 
"arlbench.core.environments.gymnasium_env": [[31, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnasium_env module": [[48, "module-arlbench.core.environments.gymnasium_env"]], "arlbench.core.environments.gymnax_env": [[32, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.gymnax_env module": [[48, "module-arlbench.core.environments.gymnax_env"]], "arlbench.core.environments.make_env": [[33, "arlbench-core-environments-make-env"]], "arlbench.core.environments.make_env module": [[48, "module-arlbench.core.environments.make_env"]], "arlbench.core.environments.xland_env": [[34, "module-arlbench.core.environments.xland_env"]], "arlbench.core.environments.xland_env module": [[48, "module-arlbench.core.environments.xland_env"]], "arlbench.core.running_statistics": [[35, "module-arlbench.core.running_statistics"]], "arlbench.core.running_statistics module": [[43, "module-arlbench.core.running_statistics"]], "arlbench.core.wrappers": [[36, "module-arlbench.core.wrappers"]], "arlbench.core.wrappers package": [[49, "arlbench-core-wrappers-package"]], "arlbench.core.wrappers.flatten_observation": [[37, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.flatten_observation module": [[49, "module-arlbench.core.wrappers.flatten_observation"]], "arlbench.core.wrappers.wrapper": [[38, "module-arlbench.core.wrappers.wrapper"]], "arlbench.core.wrappers.wrapper module": [[49, "module-arlbench.core.wrappers.wrapper"]], "arlbench.utils": [[39, "module-arlbench.utils"]], "arlbench.utils package": [[50, "arlbench-utils-package"]], "arlbench.utils.common": [[40, "module-arlbench.utils.common"]], "arlbench.utils.common module": [[50, "module-arlbench.utils.common"]]}, "docnames": ["advanced_usage/algorithm_states", "advanced_usage/autorl_paradigms", "advanced_usage/dynamic_configuration", "advanced_usage/index", "api", "api/arlbench", "api/arlbench.arlbench", "api/arlbench.autorl", 
"api/arlbench.autorl.autorl_env", "api/arlbench.autorl.checkpointing", "api/arlbench.autorl.objectives", "api/arlbench.autorl.state_features", "api/arlbench.core", "api/arlbench.core.algorithms", "api/arlbench.core.algorithms.algorithm", "api/arlbench.core.algorithms.buffers", "api/arlbench.core.algorithms.common", "api/arlbench.core.algorithms.dqn", "api/arlbench.core.algorithms.dqn.dqn", "api/arlbench.core.algorithms.dqn.models", "api/arlbench.core.algorithms.ppo", "api/arlbench.core.algorithms.ppo.models", "api/arlbench.core.algorithms.ppo.ppo", "api/arlbench.core.algorithms.prioritised_item_buffer", "api/arlbench.core.algorithms.sac", "api/arlbench.core.algorithms.sac.models", "api/arlbench.core.algorithms.sac.sac", "api/arlbench.core.environments", "api/arlbench.core.environments.autorl_env", "api/arlbench.core.environments.brax_env", "api/arlbench.core.environments.envpool_env", "api/arlbench.core.environments.gymnasium_env", "api/arlbench.core.environments.gymnax_env", "api/arlbench.core.environments.make_env", "api/arlbench.core.environments.xland_env", "api/arlbench.core.running_statistics", "api/arlbench.core.wrappers", "api/arlbench.core.wrappers.flatten_observation", "api/arlbench.core.wrappers.wrapper", "api/arlbench.utils", "api/arlbench.utils.common", "arlbench", "arlbench.autorl", "arlbench.core", "arlbench.core.algorithms", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.sac", "arlbench.core.environments", "arlbench.core.wrappers", "arlbench.utils", "basic_usage/env_subsets", "basic_usage/index", "basic_usage/objectives", "basic_usage/options", "basic_usage/seeding", "contributing", "faq", "glossary", "index", "installation", "modules"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 
2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["advanced_usage/algorithm_states.rst", "advanced_usage/autorl_paradigms.rst", "advanced_usage/dynamic_configuration.rst", "advanced_usage/index.rst", "api.rst", "api/arlbench.rst", "api/arlbench.arlbench.rst", "api/arlbench.autorl.rst", "api/arlbench.autorl.autorl_env.rst", "api/arlbench.autorl.checkpointing.rst", "api/arlbench.autorl.objectives.rst", "api/arlbench.autorl.state_features.rst", "api/arlbench.core.rst", "api/arlbench.core.algorithms.rst", "api/arlbench.core.algorithms.algorithm.rst", "api/arlbench.core.algorithms.buffers.rst", "api/arlbench.core.algorithms.common.rst", "api/arlbench.core.algorithms.dqn.rst", "api/arlbench.core.algorithms.dqn.dqn.rst", "api/arlbench.core.algorithms.dqn.models.rst", "api/arlbench.core.algorithms.ppo.rst", "api/arlbench.core.algorithms.ppo.models.rst", "api/arlbench.core.algorithms.ppo.ppo.rst", "api/arlbench.core.algorithms.prioritised_item_buffer.rst", "api/arlbench.core.algorithms.sac.rst", "api/arlbench.core.algorithms.sac.models.rst", "api/arlbench.core.algorithms.sac.sac.rst", "api/arlbench.core.environments.rst", "api/arlbench.core.environments.autorl_env.rst", "api/arlbench.core.environments.brax_env.rst", "api/arlbench.core.environments.envpool_env.rst", "api/arlbench.core.environments.gymnasium_env.rst", "api/arlbench.core.environments.gymnax_env.rst", "api/arlbench.core.environments.make_env.rst", "api/arlbench.core.environments.xland_env.rst", "api/arlbench.core.running_statistics.rst", "api/arlbench.core.wrappers.rst", "api/arlbench.core.wrappers.flatten_observation.rst", "api/arlbench.core.wrappers.wrapper.rst", "api/arlbench.utils.rst", "api/arlbench.utils.common.rst", "arlbench.rst", "arlbench.autorl.rst", "arlbench.core.rst", "arlbench.core.algorithms.rst", "arlbench.core.algorithms.dqn.rst", "arlbench.core.algorithms.ppo.rst", "arlbench.core.algorithms.sac.rst", "arlbench.core.environments.rst", "arlbench.core.wrappers.rst", 
"arlbench.utils.rst", "basic_usage/env_subsets.rst", "basic_usage/index.rst", "basic_usage/objectives.rst", "basic_usage/options.rst", "basic_usage/seeding.rst", "contributing.rst", "faq.rst", "glossary.rst", "index.rst", "installation.rst", "modules.rst"], "indexentries": {"__call__() (arlbench.autorl.objectives.emissions static method)": [[10, "arlbench.autorl.objectives.Emissions.__call__", false], [42, "arlbench.autorl.objectives.Emissions.__call__", false]], "__call__() (arlbench.autorl.objectives.objective static method)": [[10, "arlbench.autorl.objectives.Objective.__call__", false], [42, "arlbench.autorl.objectives.Objective.__call__", false]], "__call__() (arlbench.autorl.objectives.rewardmean static method)": [[10, "arlbench.autorl.objectives.RewardMean.__call__", false], [42, "arlbench.autorl.objectives.RewardMean.__call__", false]], "__call__() (arlbench.autorl.objectives.rewardstd static method)": [[10, "arlbench.autorl.objectives.RewardStd.__call__", false], [42, "arlbench.autorl.objectives.RewardStd.__call__", false]], "__call__() (arlbench.autorl.objectives.runtime static method)": [[10, "arlbench.autorl.objectives.Runtime.__call__", false], [42, "arlbench.autorl.objectives.Runtime.__call__", false]], "__call__() (arlbench.autorl.state_features.gradinfo static method)": [[11, "arlbench.autorl.state_features.GradInfo.__call__", false], [42, "arlbench.autorl.state_features.GradInfo.__call__", false]], "__call__() (arlbench.autorl.state_features.statefeature static method)": [[11, "arlbench.autorl.state_features.StateFeature.__call__", false], [42, "arlbench.autorl.state_features.StateFeature.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.cnnq method)": [[19, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false], [45, "arlbench.core.algorithms.dqn.models.CNNQ.__call__", false]], "__call__() (arlbench.core.algorithms.dqn.models.mlpq method)": [[19, "arlbench.core.algorithms.dqn.models.MLPQ.__call__", false], [45, 
"arlbench.core.algorithms.dqn.models.MLPQ.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false], [46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false], [46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.alphacoef method)": [[25, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false], [47, "arlbench.core.algorithms.sac.models.AlphaCoef.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACCNNActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACCNNCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACMLPActor.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACMLPCritic.__call__", false]], "__call__() (arlbench.core.algorithms.sac.models.sacvectorcritic method)": [[25, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false], [47, "arlbench.core.algorithms.sac.models.SACVectorCritic.__call__", false]], "__lt__() (arlbench.autorl.objectives.objective method)": [[10, "arlbench.autorl.objectives.Objective.__lt__", false], [42, 
"arlbench.autorl.objectives.Objective.__lt__", false]], "__new__() (arlbench.autorl.objectives.objective static method)": [[10, "arlbench.autorl.objectives.Objective.__new__", false], [42, "arlbench.autorl.objectives.Objective.__new__", false]], "__new__() (arlbench.autorl.state_features.statefeature static method)": [[11, "arlbench.autorl.state_features.StateFeature.__new__", false], [42, "arlbench.autorl.state_features.StateFeature.__new__", false]], "action (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.action", false]], "action (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.action", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.action", false]], "action (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.action", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.action", false]], "action (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.action", false], [47, "arlbench.core.algorithms.sac.sac.Transition.action", false]], "action_dim (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.action_dim", false]], "action_dim (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.saccnncritic 
attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.action_dim", false]], "action_dim (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.action_dim", false]], "action_space (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.action_space", false]], "action_space (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.action_space", false], [42, "arlbench.autorl.AutoRLEnv.action_space", false]], "action_space (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.action_space", false], [41, "arlbench.AutoRLEnv.action_space", false]], "action_space (arlbench.core.environments.brax_env.braxenv property)": [[29, "arlbench.core.environments.brax_env.BraxEnv.action_space", false], [48, "arlbench.core.environments.brax_env.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.braxenv property)": [[27, "arlbench.core.environments.BraxEnv.action_space", false], [48, "arlbench.core.environments.BraxEnv.action_space", false]], "action_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[30, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false], [48, "arlbench.core.environments.envpool_env.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.envpoolenv property)": [[27, "arlbench.core.environments.EnvpoolEnv.action_space", false], [48, "arlbench.core.environments.EnvpoolEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[31, 
"arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false], [48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnasiumenv property)": [[27, "arlbench.core.environments.GymnasiumEnv.action_space", false], [48, "arlbench.core.environments.GymnasiumEnv.action_space", false]], "action_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[32, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false], [48, "arlbench.core.environments.gymnax_env.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.gymnaxenv property)": [[27, "arlbench.core.environments.GymnaxEnv.action_space", false], [48, "arlbench.core.environments.GymnaxEnv.action_space", false]], "action_space (arlbench.core.environments.xland_env.xlandenv property)": [[34, "arlbench.core.environments.xland_env.XLandEnv.action_space", false], [48, "arlbench.core.environments.xland_env.XLandEnv.action_space", false]], "action_space() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.action_space", false], [48, "arlbench.core.environments.autorl_env.Environment.action_space", false]], "action_space() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.action_space", false], [48, "arlbench.core.environments.Environment.action_space", false]], "action_type (arlbench.core.algorithms.algorithm property)": [[13, "arlbench.core.algorithms.Algorithm.action_type", false], [44, "arlbench.core.algorithms.Algorithm.action_type", false]], "action_type (arlbench.core.algorithms.algorithm.algorithm property)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.action_type", false]], "activation (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.activation", 
false]], "activation (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.activation", false]], "activation (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.activation", false]], "activation (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.activation", false]], "activation (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.activation", false]], "actor_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_grads", false]], "actor_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false], [47, "arlbench.core.algorithms.sac.SACMetrics.actor_grads", false]], "actor_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.actor_loss", false]], "actor_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false], 
[47, "arlbench.core.algorithms.sac.SACMetrics.actor_loss", false]], "actor_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.actor_train_state", false]], "actor_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.actor_train_state", false]], "advantages (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.advantages", false]], "advantages (arlbench.core.algorithms.ppo.ppometrics attribute)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics.advantages", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics.advantages", false]], "algorithm (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.Algorithm", false], [44, "arlbench.core.algorithms.Algorithm", false]], "algorithm (class in arlbench.core.algorithms.algorithm)": [[14, "arlbench.core.algorithms.algorithm.Algorithm", false], [44, "arlbench.core.algorithms.algorithm.Algorithm", false]], "algorithms (arlbench.autorl.autorl_env.autorlenv attribute)": [[42, "arlbench.autorl.autorl_env.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorl.autorlenv attribute)": [[42, "arlbench.autorl.AutoRLEnv.ALGORITHMS", false]], "algorithms (arlbench.autorlenv attribute)": [[41, "arlbench.AutoRLEnv.ALGORITHMS", false]], "alpha_init (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.alpha_init", false]], "alpha_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.alpha_loss", false]], 
"alpha_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false], [47, "arlbench.core.algorithms.sac.SACMetrics.alpha_loss", false]], "alpha_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.alpha_train_state", false]], "alpha_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.alpha_train_state", false]], "alphacoef (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.AlphaCoef", false], [47, "arlbench.core.algorithms.sac.models.AlphaCoef", false]], "arlbench": [[5, "module-arlbench", false], [41, "module-arlbench", false]], "arlbench.arlbench": [[6, "module-arlbench.arlbench", false], [41, "module-arlbench.arlbench", false]], "arlbench.autorl": [[7, "module-arlbench.autorl", false], [42, "module-arlbench.autorl", false]], "arlbench.autorl.autorl_env": [[8, "module-arlbench.autorl.autorl_env", false], [42, "module-arlbench.autorl.autorl_env", false]], "arlbench.autorl.checkpointing": [[9, "module-arlbench.autorl.checkpointing", false], [42, "module-arlbench.autorl.checkpointing", false]], "arlbench.autorl.objectives": [[10, "module-arlbench.autorl.objectives", false], [42, "module-arlbench.autorl.objectives", false]], "arlbench.autorl.state_features": [[11, "module-arlbench.autorl.state_features", false], [42, "module-arlbench.autorl.state_features", false]], "arlbench.core": [[12, "module-arlbench.core", false], [43, "module-arlbench.core", false]], "arlbench.core.algorithms": [[13, "module-arlbench.core.algorithms", false], [44, "module-arlbench.core.algorithms", false]], "arlbench.core.algorithms.algorithm": [[14, 
"module-arlbench.core.algorithms.algorithm", false], [44, "module-arlbench.core.algorithms.algorithm", false]], "arlbench.core.algorithms.buffers": [[15, "module-arlbench.core.algorithms.buffers", false], [44, "module-arlbench.core.algorithms.buffers", false]], "arlbench.core.algorithms.common": [[16, "module-arlbench.core.algorithms.common", false], [44, "module-arlbench.core.algorithms.common", false]], "arlbench.core.algorithms.dqn": [[17, "module-arlbench.core.algorithms.dqn", false], [45, "module-arlbench.core.algorithms.dqn", false]], "arlbench.core.algorithms.dqn.dqn": [[18, "module-arlbench.core.algorithms.dqn.dqn", false], [45, "module-arlbench.core.algorithms.dqn.dqn", false]], "arlbench.core.algorithms.dqn.models": [[19, "module-arlbench.core.algorithms.dqn.models", false], [45, "module-arlbench.core.algorithms.dqn.models", false]], "arlbench.core.algorithms.ppo": [[20, "module-arlbench.core.algorithms.ppo", false], [46, "module-arlbench.core.algorithms.ppo", false]], "arlbench.core.algorithms.ppo.models": [[21, "module-arlbench.core.algorithms.ppo.models", false], [46, "module-arlbench.core.algorithms.ppo.models", false]], "arlbench.core.algorithms.ppo.ppo": [[22, "module-arlbench.core.algorithms.ppo.ppo", false], [46, "module-arlbench.core.algorithms.ppo.ppo", false]], "arlbench.core.algorithms.prioritised_item_buffer": [[23, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [44, "module-arlbench.core.algorithms.prioritised_item_buffer", false]], "arlbench.core.algorithms.sac": [[24, "module-arlbench.core.algorithms.sac", false], [47, "module-arlbench.core.algorithms.sac", false]], "arlbench.core.algorithms.sac.models": [[25, "module-arlbench.core.algorithms.sac.models", false], [47, "module-arlbench.core.algorithms.sac.models", false]], "arlbench.core.algorithms.sac.sac": [[26, "module-arlbench.core.algorithms.sac.sac", false], [47, "module-arlbench.core.algorithms.sac.sac", false]], "arlbench.core.environments": [[27, 
"module-arlbench.core.environments", false], [48, "module-arlbench.core.environments", false]], "arlbench.core.environments.autorl_env": [[28, "module-arlbench.core.environments.autorl_env", false], [48, "module-arlbench.core.environments.autorl_env", false]], "arlbench.core.environments.brax_env": [[29, "module-arlbench.core.environments.brax_env", false], [48, "module-arlbench.core.environments.brax_env", false]], "arlbench.core.environments.envpool_env": [[30, "module-arlbench.core.environments.envpool_env", false], [48, "module-arlbench.core.environments.envpool_env", false]], "arlbench.core.environments.gymnasium_env": [[31, "module-arlbench.core.environments.gymnasium_env", false], [48, "module-arlbench.core.environments.gymnasium_env", false]], "arlbench.core.environments.gymnax_env": [[32, "module-arlbench.core.environments.gymnax_env", false], [48, "module-arlbench.core.environments.gymnax_env", false]], "arlbench.core.environments.make_env": [[48, "module-arlbench.core.environments.make_env", false]], "arlbench.core.environments.xland_env": [[34, "module-arlbench.core.environments.xland_env", false], [48, "module-arlbench.core.environments.xland_env", false]], "arlbench.core.running_statistics": [[35, "module-arlbench.core.running_statistics", false], [43, "module-arlbench.core.running_statistics", false]], "arlbench.core.wrappers": [[36, "module-arlbench.core.wrappers", false], [49, "module-arlbench.core.wrappers", false]], "arlbench.core.wrappers.flatten_observation": [[37, "module-arlbench.core.wrappers.flatten_observation", false], [49, "module-arlbench.core.wrappers.flatten_observation", false]], "arlbench.core.wrappers.wrapper": [[38, "module-arlbench.core.wrappers.wrapper", false], [49, "module-arlbench.core.wrappers.wrapper", false]], "arlbench.utils": [[39, "module-arlbench.utils", false], [50, "module-arlbench.utils", false]], "arlbench.utils.common": [[40, "module-arlbench.utils.common", false], [50, "module-arlbench.utils.common", false]], 
"automl": [[58, "term-AutoML", true]], "autorl": [[58, "term-AutoRL", true]], "autorlenv (class in arlbench)": [[5, "arlbench.AutoRLEnv", false], [41, "arlbench.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl)": [[7, "arlbench.autorl.AutoRLEnv", false], [42, "arlbench.autorl.AutoRLEnv", false]], "autorlenv (class in arlbench.autorl.autorl_env)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv", false]], "bo": [[58, "term-BO", true]], "braxenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.BraxEnv", false], [48, "arlbench.core.environments.BraxEnv", false]], "braxenv (class in arlbench.core.environments.brax_env)": [[29, "arlbench.core.environments.brax_env.BraxEnv", false], [48, "arlbench.core.environments.brax_env.BraxEnv", false]], "buffer_state (arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false], [45, "arlbench.core.algorithms.dqn.DQNState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[20, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false], [46, "arlbench.core.algorithms.ppo.PPOState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false], [47, "arlbench.core.algorithms.sac.sac.SACState.buffer_state", false]], "buffer_state (arlbench.core.algorithms.sac.sacstate attribute)": [[24, 
"arlbench.core.algorithms.sac.SACState.buffer_state", false], [47, "arlbench.core.algorithms.sac.SACState.buffer_state", false]], "checkpointer (class in arlbench.autorl.checkpointing)": [[9, "arlbench.autorl.checkpointing.Checkpointer", false], [42, "arlbench.autorl.checkpointing.Checkpointer", false]], "checkpoints (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.checkpoints", false], [42, "arlbench.autorl.AutoRLEnv.checkpoints", false]], "checkpoints (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.checkpoints", false], [41, "arlbench.AutoRLEnv.checkpoints", false]], "cnnactorcritic (class in arlbench.core.algorithms.ppo.models)": [[21, "arlbench.core.algorithms.ppo.models.CNNActorCritic", false], [46, "arlbench.core.algorithms.ppo.models.CNNActorCritic", false]], "cnnq (class in arlbench.core.algorithms.dqn.models)": [[19, "arlbench.core.algorithms.dqn.models.CNNQ", false], [45, "arlbench.core.algorithms.dqn.models.CNNQ", false]], "config (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.config", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.config", false]], "config (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.config", false], [42, "arlbench.autorl.AutoRLEnv.config", false]], "config (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.config", false], [41, "arlbench.AutoRLEnv.config", false]], "config_space (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.config_space", false]], "config_space (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.config_space", false], [42, "arlbench.autorl.AutoRLEnv.config_space", false]], "config_space 
(arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.config_space", false], [41, "arlbench.AutoRLEnv.config_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils)": [[39, "arlbench.utils.config_space_to_gymnasium_space", false], [50, "arlbench.utils.config_space_to_gymnasium_space", false]], "config_space_to_gymnasium_space() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.config_space_to_gymnasium_space", false], [50, "arlbench.utils.common.config_space_to_gymnasium_space", false]], "config_space_to_yaml() (in module arlbench.utils)": [[39, "arlbench.utils.config_space_to_yaml", false], [50, "arlbench.utils.config_space_to_yaml", false]], "config_space_to_yaml() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.config_space_to_yaml", false], [50, "arlbench.utils.common.config_space_to_yaml", false]], "count (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[43, "arlbench.core.running_statistics.RunningStatisticsState.count", false]], "create_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[23, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false], [44, "arlbench.core.algorithms.prioritised_item_buffer.create_prioritised_item_buffer", false]], "create_with_opt_state() (arlbench.core.algorithms.dqn.dqn.dqntrainstate class method)": [[45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.ppo.ppo.ppotrainstate class method)": [[46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.create_with_opt_state", false]], "create_with_opt_state() (arlbench.core.algorithms.sac.sac.sactrainstate class method)": [[47, "arlbench.core.algorithms.sac.sac.SACTrainState.create_with_opt_state", false]], "critic (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.critic", false]], 
"critic_grads (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_grads", false]], "critic_grads (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false], [47, "arlbench.core.algorithms.sac.SACMetrics.critic_grads", false]], "critic_loss (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.critic_loss", false]], "critic_loss (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false], [47, "arlbench.core.algorithms.sac.SACMetrics.critic_loss", false]], "critic_train_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.critic_train_state", false]], "critic_train_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.critic_train_state", false]], "cur_rewards (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.cur_rewards", false]], "cur_rewards (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.cur_rewards", false]], "denormalize() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.denormalize", false], [43, "arlbench.core.running_statistics.denormalize", false]], "discrete 
(arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.discrete", false]], "discrete (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.discrete", false]], "discrete (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.discrete", false]], "done (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.done", false]], "done (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.done", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.done", false]], "done (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.done", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.done", false]], "done (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.done", false], [47, "arlbench.core.algorithms.sac.sac.Transition.done", false]], "dqn": [[58, "term-DQN", true]], "dqn (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.DQN", false], [44, "arlbench.core.algorithms.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQN", false], [45, "arlbench.core.algorithms.dqn.DQN", false]], "dqn (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics", false]], "dqnmetrics (class in arlbench.core.algorithms.dqn.dqn)": [[18, 
"arlbench.core.algorithms.dqn.dqn.DQNMetrics", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState", false]], "dqnrunnerstate (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState", false]], "dqnstate (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNState", false], [45, "arlbench.core.algorithms.dqn.DQNState", false]], "dqnstate (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNState", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNState", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult", false]], "dqntrainingresult (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult", false]], "dqntrainreturnt (in module arlbench.core.algorithms.dqn)": [[17, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false], [45, "arlbench.core.algorithms.dqn.DQNTrainReturnT", false]], "dqntrainstate (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState", false]], "emissions (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.Emissions", false], [42, "arlbench.autorl.objectives.Emissions", false]], "env_name (arlbench.core.environments.autorl_env.environment property)": [[28, "arlbench.core.environments.autorl_env.Environment.env_name", false], [48, "arlbench.core.environments.autorl_env.Environment.env_name", false]], "env_name 
(arlbench.core.environments.environment property)": [[27, "arlbench.core.environments.Environment.env_name", false], [48, "arlbench.core.environments.Environment.env_name", false]], "env_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.env_state", false]], "env_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.env_state", false]], "environment (class in arlbench.core.environments)": [[27, "arlbench.core.environments.Environment", false], [48, "arlbench.core.environments.Environment", false]], "environment (class in arlbench.core.environments.autorl_env)": [[28, "arlbench.core.environments.autorl_env.Environment", false], [48, "arlbench.core.environments.autorl_env.Environment", false]], "envpoolenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.EnvpoolEnv", false], [48, "arlbench.core.environments.EnvpoolEnv", 
false]], "envpoolenv (class in arlbench.core.environments.envpool_env)": [[30, "arlbench.core.environments.envpool_env.EnvpoolEnv", false], [48, "arlbench.core.environments.envpool_env.EnvpoolEnv", false]], "eval() (arlbench.autorl.autorl_env.autorlenv method)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.eval", false]], "eval() (arlbench.autorl.autorlenv method)": [[7, "arlbench.autorl.AutoRLEnv.eval", false], [42, "arlbench.autorl.AutoRLEnv.eval", false]], "eval() (arlbench.autorlenv method)": [[5, "arlbench.AutoRLEnv.eval", false], [41, "arlbench.AutoRLEnv.eval", false]], "eval() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.eval", false], [44, "arlbench.core.algorithms.Algorithm.eval", false]], "eval() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.eval", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.eval", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult.eval_rewards", false]], "eval_rewards 
(arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult.eval_rewards", false]], "eval_rewards (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult.eval_rewards", false]], "flattenobservationwrapper (class in arlbench.core.wrappers)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper", false], [49, "arlbench.core.wrappers.FlattenObservationWrapper", false]], "flattenobservationwrapper (class in arlbench.core.wrappers.flatten_observation)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper", false]], "from_tuple() (arlbench.core.algorithms.common.timestep method)": [[44, "arlbench.core.algorithms.common.TimeStep.from_tuple", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false], [45, "arlbench.core.algorithms.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() 
(arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false], [46, "arlbench.core.algorithms.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false], [44, "arlbench.core.algorithms.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false], [47, "arlbench.core.algorithms.sac.SAC.get_checkpoint_factory", false]], "get_checkpoint_factory() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_checkpoint_factory", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false], [44, "arlbench.core.algorithms.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false], [44, 
"arlbench.core.algorithms.algorithm.Algorithm.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_default_hpo_config", false], [44, "arlbench.core.algorithms.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false], [45, "arlbench.core.algorithms.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_default_hpo_config", false], [44, "arlbench.core.algorithms.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false], [46, "arlbench.core.algorithms.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_default_hpo_config", false], [44, "arlbench.core.algorithms.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false], [47, "arlbench.core.algorithms.sac.SAC.get_default_hpo_config", false]], "get_default_hpo_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, 
"arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_default_hpo_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false], [44, "arlbench.core.algorithms.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_default_nas_config", false], [44, "arlbench.core.algorithms.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false], [45, "arlbench.core.algorithms.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_default_nas_config", false], [44, "arlbench.core.algorithms.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false], [46, "arlbench.core.algorithms.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_default_nas_config", false]], "get_default_nas_config() 
(arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_default_nas_config", false], [44, "arlbench.core.algorithms.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false], [47, "arlbench.core.algorithms.sac.SAC.get_default_nas_config", false]], "get_default_nas_config() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_default_nas_config", false]], "get_hpo_config_space() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false], [44, "arlbench.core.algorithms.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_hpo_config_space", false], [44, "arlbench.core.algorithms.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false], [45, "arlbench.core.algorithms.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_hpo_config_space", false], [44, "arlbench.core.algorithms.PPO.get_hpo_config_space", false]], "get_hpo_config_space() 
(arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false], [46, "arlbench.core.algorithms.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_hpo_config_space", false], [44, "arlbench.core.algorithms.SAC.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false], [47, "arlbench.core.algorithms.sac.SAC.get_hpo_config_space", false]], "get_hpo_config_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_config_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false], [44, "arlbench.core.algorithms.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_hpo_search_space", false], [44, "arlbench.core.algorithms.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false], [45, "arlbench.core.algorithms.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() 
(arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_hpo_search_space", false], [44, "arlbench.core.algorithms.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false], [46, "arlbench.core.algorithms.ppo.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_hpo_search_space", false], [44, "arlbench.core.algorithms.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false], [47, "arlbench.core.algorithms.sac.SAC.get_hpo_search_space", false]], "get_hpo_search_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_hpo_search_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm static method)": [[13, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false], [44, "arlbench.core.algorithms.Algorithm.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.algorithm.algorithm static method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.get_nas_config_space", false]], 
"get_nas_config_space() (arlbench.core.algorithms.dqn static method)": [[13, "arlbench.core.algorithms.DQN.get_nas_config_space", false], [44, "arlbench.core.algorithms.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn static method)": [[17, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false], [45, "arlbench.core.algorithms.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.dqn.dqn.dqn static method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo static method)": [[13, "arlbench.core.algorithms.PPO.get_nas_config_space", false], [44, "arlbench.core.algorithms.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo.ppo static method)": [[20, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false], [46, "arlbench.core.algorithms.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.ppo.ppo.ppo static method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac static method)": [[13, "arlbench.core.algorithms.SAC.get_nas_config_space", false], [44, "arlbench.core.algorithms.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac static method)": [[24, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false], [47, "arlbench.core.algorithms.sac.SAC.get_nas_config_space", false]], "get_nas_config_space() (arlbench.core.algorithms.sac.sac.sac static method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false], [47, "arlbench.core.algorithms.sac.sac.SAC.get_nas_config_space", false]], "get_spec() 
(arlbench.autorl.objectives.emissions static method)": [[10, "arlbench.autorl.objectives.Emissions.get_spec", false], [42, "arlbench.autorl.objectives.Emissions.get_spec", false]], "get_spec() (arlbench.autorl.objectives.objective static method)": [[10, "arlbench.autorl.objectives.Objective.get_spec", false], [42, "arlbench.autorl.objectives.Objective.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardmean static method)": [[10, "arlbench.autorl.objectives.RewardMean.get_spec", false], [42, "arlbench.autorl.objectives.RewardMean.get_spec", false]], "get_spec() (arlbench.autorl.objectives.rewardstd static method)": [[10, "arlbench.autorl.objectives.RewardStd.get_spec", false], [42, "arlbench.autorl.objectives.RewardStd.get_spec", false]], "get_spec() (arlbench.autorl.objectives.runtime static method)": [[10, "arlbench.autorl.objectives.Runtime.get_spec", false], [42, "arlbench.autorl.objectives.Runtime.get_spec", false]], "get_state_space() (arlbench.autorl.state_features.gradinfo static method)": [[11, "arlbench.autorl.state_features.GradInfo.get_state_space", false], [42, "arlbench.autorl.state_features.GradInfo.get_state_space", false]], "get_state_space() (arlbench.autorl.state_features.statefeature static method)": [[11, "arlbench.autorl.state_features.StateFeature.get_state_space", false], [42, "arlbench.autorl.state_features.StateFeature.get_state_space", false]], "global_step (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", 
false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.global_step", false]], "global_step (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.global_step", false]], "gradinfo (class in arlbench.autorl.state_features)": [[11, "arlbench.autorl.state_features.GradInfo", false], [42, "arlbench.autorl.state_features.GradInfo", false]], "grads (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.grads", false]], "grads (arlbench.core.algorithms.ppo.ppometrics attribute)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics.grads", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils)": [[39, "arlbench.utils.gymnasium_space_to_gymnax_space", false], [50, "arlbench.utils.gymnasium_space_to_gymnax_space", false]], "gymnasium_space_to_gymnax_space() (in module arlbench.utils.common)": [[40, 
"arlbench.utils.common.gymnasium_space_to_gymnax_space", false], [50, "arlbench.utils.common.gymnasium_space_to_gymnax_space", false]], "gymnasiumenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.GymnasiumEnv", false], [48, "arlbench.core.environments.GymnasiumEnv", false]], "gymnasiumenv (class in arlbench.core.environments.gymnasium_env)": [[31, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false], [48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv", false]], "gymnaxenv (class in arlbench.core.environments)": [[27, "arlbench.core.environments.GymnaxEnv", false], [48, "arlbench.core.environments.GymnaxEnv", false]], "gymnaxenv (class in arlbench.core.environments.gymnax_env)": [[32, "arlbench.core.environments.gymnax_env.GymnaxEnv", false], [48, "arlbench.core.environments.gymnax_env.GymnaxEnv", false]], "hidden_size (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": 
[[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.hidden_size", false]], "hidden_size (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.hidden_size", false]], "hpo": [[58, "term-HPO", true]], "hpo_config (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.hpo_config", false], [42, "arlbench.autorl.AutoRLEnv.hpo_config", false]], "hpo_config (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.hpo_config", false], [41, "arlbench.AutoRLEnv.hpo_config", false]], "info (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.info", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.info", false]], "info (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.info", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.info", false]], "info (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.info", false], [47, "arlbench.core.algorithms.sac.sac.Transition.info", false]], "init() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.init", false], [44, "arlbench.core.algorithms.Algorithm.init", false]], "init() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.init", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.init", false]], "init() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.init", false], [44, "arlbench.core.algorithms.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn method)": [[17, "arlbench.core.algorithms.dqn.DQN.init", false], [45, 
"arlbench.core.algorithms.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.init", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.init", false]], "init() (arlbench.core.algorithms.ppo method)": [[13, "arlbench.core.algorithms.PPO.init", false], [44, "arlbench.core.algorithms.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo method)": [[20, "arlbench.core.algorithms.ppo.PPO.init", false], [46, "arlbench.core.algorithms.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.init", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.init", false]], "init() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.init", false], [44, "arlbench.core.algorithms.SAC.init", false]], "init() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.init", false], [47, "arlbench.core.algorithms.sac.SAC.init", false]], "init() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.init", false], [47, "arlbench.core.algorithms.sac.sac.SAC.init", false]], "init_state() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.init_state", false], [43, "arlbench.core.running_statistics.init_state", false]], "items() (arlbench.core.algorithms.common.timestep method)": [[16, "arlbench.core.algorithms.common.TimeStep.items", false], [44, "arlbench.core.algorithms.common.TimeStep.items", false]], "key (arlbench.autorl.objectives.emissions attribute)": [[42, "arlbench.autorl.objectives.Emissions.KEY", false]], "key (arlbench.autorl.objectives.objective attribute)": [[42, "arlbench.autorl.objectives.Objective.KEY", false]], "key (arlbench.autorl.objectives.rewardmean attribute)": [[42, "arlbench.autorl.objectives.RewardMean.KEY", false]], "key (arlbench.autorl.objectives.rewardstd attribute)": [[42, 
"arlbench.autorl.objectives.RewardStd.KEY", false]], "key (arlbench.autorl.objectives.runtime attribute)": [[42, "arlbench.autorl.objectives.Runtime.KEY", false]], "key (arlbench.autorl.state_features.gradinfo attribute)": [[42, "arlbench.autorl.state_features.GradInfo.KEY", false]], "key (arlbench.autorl.state_features.statefeature attribute)": [[42, "arlbench.autorl.state_features.StateFeature.KEY", false]], "keys() (arlbench.core.algorithms.common.timestep method)": [[16, "arlbench.core.algorithms.common.TimeStep.keys", false], [44, "arlbench.core.algorithms.common.TimeStep.keys", false]], "last_obs (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.last_obs", false]], "load() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.load", false], [42, "arlbench.autorl.checkpointing.Checkpointer.load", false]], "load_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false], [42, "arlbench.autorl.checkpointing.Checkpointer.load_buffer", false]], "log_prob (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.log_prob", false]], "log_std_max (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_max", false]], "log_std_max (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_max", false]], "log_std_min (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.log_std_min", false]], "log_std_min (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.log_std_min", false]], "loss 
(arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppo.ppometrics attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics.loss", false]], "loss (arlbench.core.algorithms.ppo.ppometrics attribute)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics.loss", false]], "make_env() (in module arlbench.core.environments)": [[27, "arlbench.core.environments.make_env", false], [33, "arlbench.core.environments.make_env", false], [48, "arlbench.core.environments.make_env", false]], "make_env() (in module arlbench.core.environments.make_env)": [[48, "arlbench.core.environments.make_env.make_env", false]], "make_prioritised_item_buffer() (in module arlbench.core.algorithms.prioritised_item_buffer)": [[23, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false], [44, "arlbench.core.algorithms.prioritised_item_buffer.make_prioritised_item_buffer", false]], "mean (arlbench.core.running_statistics.nestedmeanstd attribute)": [[43, "arlbench.core.running_statistics.NestedMeanStd.mean", false]], "metrics (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult.metrics", false]], "metrics 
(arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult.metrics", false]], "metrics (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult.metrics", false]], "mlpactorcritic (class in arlbench.core.algorithms.ppo.models)": [[21, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false], [46, "arlbench.core.algorithms.ppo.models.MLPActorCritic", false]], "mlpq (class in arlbench.core.algorithms.dqn.models)": [[19, "arlbench.core.algorithms.dqn.models.MLPQ", false], [45, "arlbench.core.algorithms.dqn.models.MLPQ", false]], "mode() (arlbench.core.algorithms.sac.models.tanhtransformeddistribution method)": [[25, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false], [47, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution.mode", false]], "module": [[5, "module-arlbench", false], [6, "module-arlbench.arlbench", false], [7, "module-arlbench.autorl", false], [8, "module-arlbench.autorl.autorl_env", false], [9, "module-arlbench.autorl.checkpointing", false], [10, "module-arlbench.autorl.objectives", false], [11, "module-arlbench.autorl.state_features", false], [12, "module-arlbench.core", false], [13, "module-arlbench.core.algorithms", false], [14, "module-arlbench.core.algorithms.algorithm", false], [15, 
"module-arlbench.core.algorithms.buffers", false], [16, "module-arlbench.core.algorithms.common", false], [17, "module-arlbench.core.algorithms.dqn", false], [18, "module-arlbench.core.algorithms.dqn.dqn", false], [19, "module-arlbench.core.algorithms.dqn.models", false], [20, "module-arlbench.core.algorithms.ppo", false], [21, "module-arlbench.core.algorithms.ppo.models", false], [22, "module-arlbench.core.algorithms.ppo.ppo", false], [23, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [24, "module-arlbench.core.algorithms.sac", false], [25, "module-arlbench.core.algorithms.sac.models", false], [26, "module-arlbench.core.algorithms.sac.sac", false], [27, "module-arlbench.core.environments", false], [28, "module-arlbench.core.environments.autorl_env", false], [29, "module-arlbench.core.environments.brax_env", false], [30, "module-arlbench.core.environments.envpool_env", false], [31, "module-arlbench.core.environments.gymnasium_env", false], [32, "module-arlbench.core.environments.gymnax_env", false], [34, "module-arlbench.core.environments.xland_env", false], [35, "module-arlbench.core.running_statistics", false], [36, "module-arlbench.core.wrappers", false], [37, "module-arlbench.core.wrappers.flatten_observation", false], [38, "module-arlbench.core.wrappers.wrapper", false], [39, "module-arlbench.utils", false], [40, "module-arlbench.utils.common", false], [41, "module-arlbench", false], [41, "module-arlbench.arlbench", false], [42, "module-arlbench.autorl", false], [42, "module-arlbench.autorl.autorl_env", false], [42, "module-arlbench.autorl.checkpointing", false], [42, "module-arlbench.autorl.objectives", false], [42, "module-arlbench.autorl.state_features", false], [43, "module-arlbench.core", false], [43, "module-arlbench.core.running_statistics", false], [44, "module-arlbench.core.algorithms", false], [44, "module-arlbench.core.algorithms.algorithm", false], [44, "module-arlbench.core.algorithms.buffers", false], [44, 
"module-arlbench.core.algorithms.common", false], [44, "module-arlbench.core.algorithms.prioritised_item_buffer", false], [45, "module-arlbench.core.algorithms.dqn", false], [45, "module-arlbench.core.algorithms.dqn.dqn", false], [45, "module-arlbench.core.algorithms.dqn.models", false], [46, "module-arlbench.core.algorithms.ppo", false], [46, "module-arlbench.core.algorithms.ppo.models", false], [46, "module-arlbench.core.algorithms.ppo.ppo", false], [47, "module-arlbench.core.algorithms.sac", false], [47, "module-arlbench.core.algorithms.sac.models", false], [47, "module-arlbench.core.algorithms.sac.sac", false], [48, "module-arlbench.core.environments", false], [48, "module-arlbench.core.environments.autorl_env", false], [48, "module-arlbench.core.environments.brax_env", false], [48, "module-arlbench.core.environments.envpool_env", false], [48, "module-arlbench.core.environments.gymnasium_env", false], [48, "module-arlbench.core.environments.gymnax_env", false], [48, "module-arlbench.core.environments.make_env", false], [48, "module-arlbench.core.environments.xland_env", false], [49, "module-arlbench.core.wrappers", false], [49, "module-arlbench.core.wrappers.flatten_observation", false], [49, "module-arlbench.core.wrappers.wrapper", false], [50, "module-arlbench.utils", false], [50, "module-arlbench.utils.common", false]], "mrp_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[42, "arlbench.autorl.checkpointing.Checkpointer.MRP_FILE", false]], "multi-fidelity optimization": [[58, "term-Multi-fidelity-optimization", true]], "n_critics (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.n_critics", false]], "n_envs (arlbench.core.environments.autorl_env.environment property)": [[28, "arlbench.core.environments.autorl_env.Environment.n_envs", false], [48, "arlbench.core.environments.autorl_env.Environment.n_envs", false]], "n_envs (arlbench.core.environments.environment 
property)": [[27, "arlbench.core.environments.Environment.n_envs", false], [48, "arlbench.core.environments.Environment.n_envs", false]], "name (arlbench.core.algorithms.algorithm attribute)": [[44, "arlbench.core.algorithms.Algorithm.name", false]], "name (arlbench.core.algorithms.algorithm.algorithm attribute)": [[44, "arlbench.core.algorithms.algorithm.Algorithm.name", false]], "name (arlbench.core.algorithms.dqn attribute)": [[44, "arlbench.core.algorithms.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn attribute)": [[45, "arlbench.core.algorithms.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.dqn.dqn attribute)": [[45, "arlbench.core.algorithms.dqn.dqn.DQN.name", false]], "name (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.name", false]], "name (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.name", false]], "name (arlbench.core.algorithms.ppo attribute)": [[44, "arlbench.core.algorithms.PPO.name", false]], "name (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.name", false]], "name (arlbench.core.algorithms.ppo.ppo attribute)": [[46, "arlbench.core.algorithms.ppo.PPO.name", false]], "name (arlbench.core.algorithms.ppo.ppo.ppo attribute)": [[46, "arlbench.core.algorithms.ppo.ppo.PPO.name", false]], "name (arlbench.core.algorithms.sac attribute)": [[44, "arlbench.core.algorithms.SAC.name", false]], "name (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.name", false]], "name (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.name", false]], "name 
(arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.name", false]], "name (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.name", false]], "name (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.name", false]], "name (arlbench.core.algorithms.sac.sac attribute)": [[47, "arlbench.core.algorithms.sac.SAC.name", false]], "name (arlbench.core.algorithms.sac.sac.sac attribute)": [[47, "arlbench.core.algorithms.sac.sac.SAC.name", false]], "nestedmeanstd (class in arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.NestedMeanStd", false], [43, "arlbench.core.running_statistics.NestedMeanStd", false]], "network_state (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[47, "arlbench.core.algorithms.sac.sac.SACTrainState.network_state", false]], "nodes_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[42, "arlbench.autorl.checkpointing.Checkpointer.NODES_FILE", false]], "normalize() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.normalize", false], [43, "arlbench.core.running_statistics.normalize", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate 
attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.normalizer_state", false]], "normalizer_state (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.normalizer_state", false]], "numpy_to_jax() (in module arlbench.core.environments.envpool_env)": [[30, "arlbench.core.environments.envpool_env.numpy_to_jax", false], [48, "arlbench.core.environments.envpool_env.numpy_to_jax", false]], "objective (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.Objective", false], [42, "arlbench.autorl.objectives.Objective", false]], "objectives (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.objectives", false]], "objectives (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.objectives", false], [42, "arlbench.autorl.AutoRLEnv.objectives", false]], "objectives (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.objectives", false], [41, "arlbench.AutoRLEnv.objectives", false]], "obs (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false], 
[45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.obs", false]], "obs (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.obs", false]], "obs (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.obs", false]], "obs (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.obs", false], [47, "arlbench.core.algorithms.sac.sac.Transition.obs", false]], "obs (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.obs", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.obs", false]], "observation_space (arlbench.autorl.autorl_env.autorlenv property)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorl.autorlenv property)": [[7, "arlbench.autorl.AutoRLEnv.observation_space", false], [42, 
"arlbench.autorl.AutoRLEnv.observation_space", false]], "observation_space (arlbench.autorlenv property)": [[5, "arlbench.AutoRLEnv.observation_space", false], [41, "arlbench.AutoRLEnv.observation_space", false]], "observation_space (arlbench.core.environments.brax_env.braxenv property)": [[29, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false], [48, "arlbench.core.environments.brax_env.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.braxenv property)": [[27, "arlbench.core.environments.BraxEnv.observation_space", false], [48, "arlbench.core.environments.BraxEnv.observation_space", false]], "observation_space (arlbench.core.environments.envpool_env.envpoolenv property)": [[30, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false], [48, "arlbench.core.environments.envpool_env.EnvpoolEnv.observation_space", false]], "observation_space (arlbench.core.environments.envpoolenv property)": [[27, "arlbench.core.environments.EnvpoolEnv.observation_space", false], [48, "arlbench.core.environments.EnvpoolEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasium_env.gymnasiumenv property)": [[31, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false], [48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnasiumenv property)": [[27, "arlbench.core.environments.GymnasiumEnv.observation_space", false], [48, "arlbench.core.environments.GymnasiumEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnax_env.gymnaxenv property)": [[32, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false], [48, "arlbench.core.environments.gymnax_env.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.gymnaxenv property)": [[27, "arlbench.core.environments.GymnaxEnv.observation_space", false], 
[48, "arlbench.core.environments.GymnaxEnv.observation_space", false]], "observation_space (arlbench.core.environments.xland_env.xlandenv property)": [[34, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false], [48, "arlbench.core.environments.xland_env.XLandEnv.observation_space", false]], "observation_space (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper property)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.observation_space", false]], "observation_space (arlbench.core.wrappers.flattenobservationwrapper property)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false], [49, "arlbench.core.wrappers.FlattenObservationWrapper.observation_space", false]], "observation_space() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.observation_space", false], [48, "arlbench.core.environments.autorl_env.Environment.observation_space", false]], "observation_space() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.observation_space", false], [48, "arlbench.core.environments.Environment.observation_space", false]], "opt_state (arlbench.core.algorithms.dqn.dqn.dqntrainstate attribute)": [[45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.opt_state", false]], "opt_state (arlbench.core.algorithms.ppo.ppo.ppotrainstate attribute)": [[46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.opt_state", false]], "parent (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.parent", false]], "parent (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.parent", false]], "parent (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, 
"arlbench.core.algorithms.ppo.models.CNNActorCritic.parent", false]], "parent (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.parent", false]], "parent (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.parent", false]], "ppo": [[58, "term-PPO", true]], "ppo (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.PPO", false], [44, "arlbench.core.algorithms.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPO", false], [46, "arlbench.core.algorithms.ppo.PPO", false]], "ppo (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO", false]], "ppometrics (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOMetrics", false], [46, "arlbench.core.algorithms.ppo.PPOMetrics", false]], "ppometrics (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOMetrics", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo)": [[20, 
"arlbench.core.algorithms.ppo.PPORunnerState", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState", false]], "pporunnerstate (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState", false]], "ppostate (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOState", false], [46, "arlbench.core.algorithms.ppo.PPOState", false]], "ppostate (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOState", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOState", false]], "ppotrainingresult (class in arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult", false]], "ppotrainingresult (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult", false]], "ppotrainreturnt (in module arlbench.core.algorithms.ppo)": [[20, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false], [46, "arlbench.core.algorithms.ppo.PPOTrainReturnT", false]], "ppotrainstate (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState", false]], "predict() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.predict", false], [44, "arlbench.core.algorithms.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.predict", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.predict", false]], "predict() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.predict", false], [44, "arlbench.core.algorithms.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn 
method)": [[17, "arlbench.core.algorithms.dqn.DQN.predict", false], [45, "arlbench.core.algorithms.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.predict", false]], "predict() (arlbench.core.algorithms.ppo method)": [[13, "arlbench.core.algorithms.PPO.predict", false], [44, "arlbench.core.algorithms.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo method)": [[20, "arlbench.core.algorithms.ppo.PPO.predict", false], [46, "arlbench.core.algorithms.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.predict", false]], "predict() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.predict", false], [44, "arlbench.core.algorithms.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.predict", false], [47, "arlbench.core.algorithms.sac.SAC.predict", false]], "predict() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.predict", false], [47, "arlbench.core.algorithms.sac.sac.SAC.predict", false]], "random search": [[58, "term-Random-Search", true]], "rank (arlbench.autorl.objectives.emissions attribute)": [[42, "arlbench.autorl.objectives.Emissions.RANK", false]], "rank (arlbench.autorl.objectives.objective attribute)": [[42, "arlbench.autorl.objectives.Objective.RANK", false]], "rank (arlbench.autorl.objectives.rewardmean attribute)": [[42, "arlbench.autorl.objectives.RewardMean.RANK", false]], "rank (arlbench.autorl.objectives.rewardstd attribute)": [[42, "arlbench.autorl.objectives.RewardStd.RANK", false]], "rank (arlbench.autorl.objectives.runtime attribute)": [[42, "arlbench.autorl.objectives.Runtime.RANK", false]], "recursive_concat() (in 
module arlbench.utils)": [[39, "arlbench.utils.recursive_concat", false], [50, "arlbench.utils.recursive_concat", false]], "recursive_concat() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.recursive_concat", false], [50, "arlbench.utils.common.recursive_concat", false]], "replace() (arlbench.core.algorithms.common.timestep method)": [[44, "arlbench.core.algorithms.common.TimeStep.replace", false]], "replace() (arlbench.core.algorithms.dqn.dqn.dqntrainstate method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.replace", false]], "replace() (arlbench.core.algorithms.ppo.ppo.ppotrainstate method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainState.replace", false]], "replace() (arlbench.core.algorithms.sac.sac.sactrainstate method)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainState.replace", false]], "replace() (arlbench.core.running_statistics.nestedmeanstd method)": [[35, "arlbench.core.running_statistics.NestedMeanStd.replace", false], [43, "arlbench.core.running_statistics.NestedMeanStd.replace", false]], "replace() (arlbench.core.running_statistics.runningstatisticsstate method)": [[35, "arlbench.core.running_statistics.RunningStatisticsState.replace", false], [43, "arlbench.core.running_statistics.RunningStatisticsState.replace", false]], "reset() (arlbench.autorl.autorl_env.autorlenv method)": [[8, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.reset", false]], "reset() (arlbench.autorl.autorlenv method)": [[7, "arlbench.autorl.AutoRLEnv.reset", false], [42, "arlbench.autorl.AutoRLEnv.reset", false]], "reset() (arlbench.autorlenv method)": [[5, "arlbench.AutoRLEnv.reset", false], [41, "arlbench.AutoRLEnv.reset", false]], "reset() 
(arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.reset", false], [48, "arlbench.core.environments.autorl_env.Environment.reset", false]], "reset() (arlbench.core.environments.brax_env.braxenv method)": [[48, "arlbench.core.environments.brax_env.BraxEnv.reset", false]], "reset() (arlbench.core.environments.braxenv method)": [[48, "arlbench.core.environments.BraxEnv.reset", false]], "reset() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.reset", false], [48, "arlbench.core.environments.Environment.reset", false]], "reset() (arlbench.core.environments.envpool_env.envpoolenv method)": [[48, "arlbench.core.environments.envpool_env.EnvpoolEnv.reset", false]], "reset() (arlbench.core.environments.envpoolenv method)": [[48, "arlbench.core.environments.EnvpoolEnv.reset", false]], "reset() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnasiumenv method)": [[48, "arlbench.core.environments.GymnasiumEnv.reset", false]], "reset() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[48, "arlbench.core.environments.gymnax_env.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.gymnaxenv method)": [[48, "arlbench.core.environments.GymnaxEnv.reset", false]], "reset() (arlbench.core.environments.xland_env.xlandenv method)": [[48, "arlbench.core.environments.xland_env.XLandEnv.reset", false]], "reset() (arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.reset", false]], "reset() (arlbench.core.wrappers.flattenobservationwrapper method)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper.reset", false], [49, 
"arlbench.core.wrappers.FlattenObservationWrapper.reset", false]], "return_buffer (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer", false]], "return_buffer (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.return_buffer_idx", false]], "return_buffer_idx (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.return_buffer_idx", false]], "reward (arlbench.core.algorithms.common.timestep attribute)": [[44, "arlbench.core.algorithms.common.TimeStep.reward", false]], "reward (arlbench.core.algorithms.dqn.dqn.transition attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition.reward", false]], "reward (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.reward", false]], "reward (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.reward", false], [47, "arlbench.core.algorithms.sac.sac.Transition.reward", false]], "rewardmean (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.RewardMean", false], [42, "arlbench.autorl.objectives.RewardMean", false]], "rewardstd (class in arlbench.autorl.objectives)": [[10, 
"arlbench.autorl.objectives.RewardStd", false], [42, "arlbench.autorl.objectives.RewardStd", false]], "rng (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.rng", false]], "rng (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.rng", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.rng", false]], "rng (arlbench.core.algorithms.sac.sac.sacrunnerstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState.rng", false]], "rng (arlbench.core.algorithms.sac.sacrunnerstate attribute)": [[24, "arlbench.core.algorithms.sac.SACRunnerState.rng", false], [47, "arlbench.core.algorithms.sac.SACRunnerState.rng", false]], "run_arlbench() (in module arlbench)": [[5, "arlbench.run_arlbench", false], [41, "arlbench.run_arlbench", false]], "run_arlbench() (in module arlbench.arlbench)": [[6, "arlbench.arlbench.run_arlbench", false], [41, "arlbench.arlbench.run_arlbench", false]], "runner_state (arlbench.core.algorithms.dqn.dqn.dqnstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNState.runner_state", false]], "runner_state (arlbench.core.algorithms.dqn.dqnstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNState.runner_state", false], [45, "arlbench.core.algorithms.dqn.DQNState.runner_state", false]], "runner_state 
(arlbench.core.algorithms.ppo.ppo.ppostate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.ppo.ppostate attribute)": [[20, "arlbench.core.algorithms.ppo.PPOState.runner_state", false], [46, "arlbench.core.algorithms.ppo.PPOState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sac.sacstate attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false], [47, "arlbench.core.algorithms.sac.sac.SACState.runner_state", false]], "runner_state (arlbench.core.algorithms.sac.sacstate attribute)": [[24, "arlbench.core.algorithms.sac.SACState.runner_state", false], [47, "arlbench.core.algorithms.sac.SACState.runner_state", false]], "runningstatisticsstate (class in arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.RunningStatisticsState", false], [43, "arlbench.core.running_statistics.RunningStatisticsState", false]], "runtime (class in arlbench.autorl.objectives)": [[10, "arlbench.autorl.objectives.Runtime", false], [42, "arlbench.autorl.objectives.Runtime", false]], "sac": [[58, "term-SAC", true]], "sac (class in arlbench.core.algorithms)": [[13, "arlbench.core.algorithms.SAC", false], [44, "arlbench.core.algorithms.SAC", false]], "sac (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SAC", false], [47, "arlbench.core.algorithms.sac.SAC", false]], "sac (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SAC", false], [47, "arlbench.core.algorithms.sac.sac.SAC", false]], "saccnnactor (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACCNNActor", false], [47, "arlbench.core.algorithms.sac.models.SACCNNActor", false]], "saccnncritic (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACCNNCritic", false], [47, 
"arlbench.core.algorithms.sac.models.SACCNNCritic", false]], "sacmetrics (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACMetrics", false], [47, "arlbench.core.algorithms.sac.SACMetrics", false]], "sacmetrics (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics", false]], "sacmlpactor (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACMLPActor", false], [47, "arlbench.core.algorithms.sac.models.SACMLPActor", false]], "sacmlpcritic (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACMLPCritic", false], [47, "arlbench.core.algorithms.sac.models.SACMLPCritic", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACRunnerState", false], [47, "arlbench.core.algorithms.sac.SACRunnerState", false]], "sacrunnerstate (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACRunnerState", false], [47, "arlbench.core.algorithms.sac.sac.SACRunnerState", false]], "sacstate (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACState", false], [47, "arlbench.core.algorithms.sac.SACState", false]], "sacstate (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACState", false], [47, "arlbench.core.algorithms.sac.sac.SACState", false]], "sactrainingresult (class in arlbench.core.algorithms.sac)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult", false]], "sactrainingresult (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult", false]], "sactrainreturnt (in module arlbench.core.algorithms.sac)": [[24, 
"arlbench.core.algorithms.sac.SACTrainReturnT", false], [47, "arlbench.core.algorithms.sac.SACTrainReturnT", false]], "sactrainstate (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainState", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainState", false]], "sacvectorcritic (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.SACVectorCritic", false], [47, "arlbench.core.algorithms.sac.models.SACVectorCritic", false]], "sample_action() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[48, "arlbench.core.environments.gymnax_env.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.gymnaxenv method)": [[48, "arlbench.core.environments.GymnaxEnv.sample_action", false]], "sample_action() (arlbench.core.environments.xland_env.xlandenv method)": [[48, "arlbench.core.environments.xland_env.XLandEnv.sample_action", false]], "sample_actions() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.sample_actions", false], [48, "arlbench.core.environments.autorl_env.Environment.sample_actions", false]], "sample_actions() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.sample_actions", false], [48, "arlbench.core.environments.Environment.sample_actions", false]], "save() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.save", false], [42, "arlbench.autorl.checkpointing.Checkpointer.save", false]], "save_buffer() (arlbench.autorl.checkpointing.checkpointer static method)": [[9, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false], [42, "arlbench.autorl.checkpointing.Checkpointer.save_buffer", false]], "save_defaults_to_yaml() (in module arlbench.utils)": [[39, "arlbench.utils.save_defaults_to_yaml", false], [50, "arlbench.utils.save_defaults_to_yaml", false]], 
"save_defaults_to_yaml() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.save_defaults_to_yaml", false], [50, "arlbench.utils.common.save_defaults_to_yaml", false]], "scalars_file (arlbench.autorl.checkpointing.checkpointer attribute)": [[42, "arlbench.autorl.checkpointing.Checkpointer.SCALARS_FILE", false]], "scope (arlbench.core.algorithms.dqn.models.cnnq attribute)": [[45, "arlbench.core.algorithms.dqn.models.CNNQ.scope", false]], "scope (arlbench.core.algorithms.dqn.models.mlpq attribute)": [[45, "arlbench.core.algorithms.dqn.models.MLPQ.scope", false]], "scope (arlbench.core.algorithms.ppo.models.cnnactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.scope", false]], "scope (arlbench.core.algorithms.ppo.models.mlpactorcritic attribute)": [[46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.alphacoef attribute)": [[47, "arlbench.core.algorithms.sac.models.AlphaCoef.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnnactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.saccnncritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACCNNCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpactor attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPActor.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacmlpcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACMLPCritic.scope", false]], "scope (arlbench.core.algorithms.sac.models.sacvectorcritic attribute)": [[47, "arlbench.core.algorithms.sac.models.SACVectorCritic.scope", false]], "setup() (arlbench.core.algorithms.dqn.models.cnnq method)": [[19, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false], [45, "arlbench.core.algorithms.dqn.models.CNNQ.setup", false]], "setup() (arlbench.core.algorithms.dqn.models.mlpq method)": [[19, 
"arlbench.core.algorithms.dqn.models.MLPQ.setup", false], [45, "arlbench.core.algorithms.dqn.models.MLPQ.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.cnnactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false], [46, "arlbench.core.algorithms.ppo.models.CNNActorCritic.setup", false]], "setup() (arlbench.core.algorithms.ppo.models.mlpactorcritic method)": [[21, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false], [46, "arlbench.core.algorithms.ppo.models.MLPActorCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.alphacoef method)": [[25, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false], [47, "arlbench.core.algorithms.sac.models.AlphaCoef.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnnactor method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNActor.setup", false], [47, "arlbench.core.algorithms.sac.models.SACCNNActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.saccnncritic method)": [[25, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false], [47, "arlbench.core.algorithms.sac.models.SACCNNCritic.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpactor method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false], [47, "arlbench.core.algorithms.sac.models.SACMLPActor.setup", false]], "setup() (arlbench.core.algorithms.sac.models.sacmlpcritic method)": [[25, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false], [47, "arlbench.core.algorithms.sac.models.SACMLPCritic.setup", false]], "statefeature (class in arlbench.autorl.state_features)": [[11, "arlbench.autorl.state_features.StateFeature", false], [42, "arlbench.autorl.state_features.StateFeature", false]], "std (arlbench.core.running_statistics.nestedmeanstd attribute)": [[43, "arlbench.core.running_statistics.NestedMeanStd.std", false]], "step() (arlbench.autorl.autorl_env.autorlenv method)": [[8, 
"arlbench.autorl.autorl_env.AutoRLEnv.step", false], [42, "arlbench.autorl.autorl_env.AutoRLEnv.step", false]], "step() (arlbench.autorl.autorlenv method)": [[7, "arlbench.autorl.AutoRLEnv.step", false], [42, "arlbench.autorl.AutoRLEnv.step", false]], "step() (arlbench.autorlenv method)": [[5, "arlbench.AutoRLEnv.step", false], [41, "arlbench.AutoRLEnv.step", false]], "step() (arlbench.core.environments.autorl_env.environment method)": [[28, "arlbench.core.environments.autorl_env.Environment.step", false], [48, "arlbench.core.environments.autorl_env.Environment.step", false]], "step() (arlbench.core.environments.brax_env.braxenv method)": [[48, "arlbench.core.environments.brax_env.BraxEnv.step", false]], "step() (arlbench.core.environments.braxenv method)": [[48, "arlbench.core.environments.BraxEnv.step", false]], "step() (arlbench.core.environments.environment method)": [[27, "arlbench.core.environments.Environment.step", false], [48, "arlbench.core.environments.Environment.step", false]], "step() (arlbench.core.environments.envpool_env.envpoolenv method)": [[48, "arlbench.core.environments.envpool_env.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.envpoolenv method)": [[48, "arlbench.core.environments.EnvpoolEnv.step", false]], "step() (arlbench.core.environments.gymnasium_env.gymnasiumenv method)": [[48, "arlbench.core.environments.gymnasium_env.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnasiumenv method)": [[48, "arlbench.core.environments.GymnasiumEnv.step", false]], "step() (arlbench.core.environments.gymnax_env.gymnaxenv method)": [[48, "arlbench.core.environments.gymnax_env.GymnaxEnv.step", false]], "step() (arlbench.core.environments.gymnaxenv method)": [[48, "arlbench.core.environments.GymnaxEnv.step", false]], "step() (arlbench.core.environments.xland_env.xlandenv method)": [[48, "arlbench.core.environments.xland_env.XLandEnv.step", false]], "step() 
(arlbench.core.wrappers.flatten_observation.flattenobservationwrapper method)": [[37, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false], [49, "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper.step", false]], "step() (arlbench.core.wrappers.flattenobservationwrapper method)": [[36, "arlbench.core.wrappers.FlattenObservationWrapper.step", false], [49, "arlbench.core.wrappers.FlattenObservationWrapper.step", false]], "summed_variance (arlbench.core.running_statistics.runningstatisticsstate attribute)": [[43, "arlbench.core.running_statistics.RunningStatisticsState.summed_variance", false]], "tanhtransformeddistribution (class in arlbench.core.algorithms.sac.models)": [[25, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false], [47, "arlbench.core.algorithms.sac.models.TanhTransformedDistribution", false]], "target_params (arlbench.core.algorithms.dqn.dqn.dqntrainstate attribute)": [[45, "arlbench.core.algorithms.dqn.dqn.DQNTrainState.target_params", false]], "target_params (arlbench.core.algorithms.sac.sac.sactrainstate attribute)": [[47, "arlbench.core.algorithms.sac.sac.SACTrainState.target_params", false]], "td_error (arlbench.core.algorithms.dqn.dqn.dqnmetrics attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.dqn.dqnmetrics attribute)": [[17, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false], [45, "arlbench.core.algorithms.dqn.DQNMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sac.sacmetrics attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false], [47, "arlbench.core.algorithms.sac.sac.SACMetrics.td_error", false]], "td_error (arlbench.core.algorithms.sac.sacmetrics attribute)": [[24, "arlbench.core.algorithms.sac.SACMetrics.td_error", false], [47, "arlbench.core.algorithms.sac.SACMetrics.td_error", 
false]], "timestep (class in arlbench.core.algorithms.common)": [[16, "arlbench.core.algorithms.common.TimeStep", false], [44, "arlbench.core.algorithms.common.TimeStep", false]], "to_tuple() (arlbench.core.algorithms.common.timestep method)": [[44, "arlbench.core.algorithms.common.TimeStep.to_tuple", false]], "train() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.train", false], [44, "arlbench.core.algorithms.Algorithm.train", false]], "train() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.train", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.train", false]], "train() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.train", false], [44, "arlbench.core.algorithms.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn method)": [[17, "arlbench.core.algorithms.dqn.DQN.train", false], [45, "arlbench.core.algorithms.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.train", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.train", false]], "train() (arlbench.core.algorithms.ppo method)": [[13, "arlbench.core.algorithms.PPO.train", false], [44, "arlbench.core.algorithms.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo method)": [[20, "arlbench.core.algorithms.ppo.PPO.train", false], [46, "arlbench.core.algorithms.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.ppo.ppo.ppo method)": [[22, "arlbench.core.algorithms.ppo.ppo.PPO.train", false], [46, "arlbench.core.algorithms.ppo.ppo.PPO.train", false]], "train() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.train", false], [44, "arlbench.core.algorithms.SAC.train", false]], "train() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.train", false], [47, "arlbench.core.algorithms.sac.SAC.train", false]], 
"train() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.train", false], [47, "arlbench.core.algorithms.sac.sac.SAC.train", false]], "train_state (arlbench.core.algorithms.dqn.dqn.dqnrunnerstate attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.dqn.dqnrunnerstate attribute)": [[17, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false], [45, "arlbench.core.algorithms.dqn.DQNRunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.ppo.pporunnerstate attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false], [46, "arlbench.core.algorithms.ppo.ppo.PPORunnerState.train_state", false]], "train_state (arlbench.core.algorithms.ppo.pporunnerstate attribute)": [[20, "arlbench.core.algorithms.ppo.PPORunnerState.train_state", false], [46, "arlbench.core.algorithms.ppo.PPORunnerState.train_state", false]], "trajectories (arlbench.core.algorithms.dqn.dqn.dqntrainingresult attribute)": [[18, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false], [45, "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.dqn.dqntrainingresult attribute)": [[17, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false], [45, "arlbench.core.algorithms.dqn.DQNTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppo.ppotrainingresult attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false], [46, "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.ppo.ppotrainingresult attribute)": [[20, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", false], [46, "arlbench.core.algorithms.ppo.PPOTrainingResult.trajectories", 
false]], "trajectories (arlbench.core.algorithms.sac.sac.sactrainingresult attribute)": [[26, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false], [47, "arlbench.core.algorithms.sac.sac.SACTrainingResult.trajectories", false]], "trajectories (arlbench.core.algorithms.sac.sactrainingresult attribute)": [[24, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false], [47, "arlbench.core.algorithms.sac.SACTrainingResult.trajectories", false]], "transition (class in arlbench.core.algorithms.dqn.dqn)": [[18, "arlbench.core.algorithms.dqn.dqn.Transition", false], [45, "arlbench.core.algorithms.dqn.dqn.Transition", false]], "transition (class in arlbench.core.algorithms.ppo.ppo)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition", false]], "transition (class in arlbench.core.algorithms.sac.sac)": [[26, "arlbench.core.algorithms.sac.sac.Transition", false], [47, "arlbench.core.algorithms.sac.sac.Transition", false]], "tuple_concat() (in module arlbench.utils)": [[39, "arlbench.utils.tuple_concat", false], [50, "arlbench.utils.tuple_concat", false]], "tuple_concat() (in module arlbench.utils.common)": [[40, "arlbench.utils.common.tuple_concat", false], [50, "arlbench.utils.common.tuple_concat", false]], "uniform_sample() (in module arlbench.core.algorithms.buffers)": [[15, "arlbench.core.algorithms.buffers.uniform_sample", false], [44, "arlbench.core.algorithms.buffers.uniform_sample", false]], "update() (arlbench.core.algorithms.dqn method)": [[13, "arlbench.core.algorithms.DQN.update", false], [44, "arlbench.core.algorithms.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn method)": [[17, "arlbench.core.algorithms.dqn.DQN.update", false], [45, "arlbench.core.algorithms.dqn.DQN.update", false]], "update() (arlbench.core.algorithms.dqn.dqn.dqn method)": [[18, "arlbench.core.algorithms.dqn.dqn.DQN.update", false], [45, "arlbench.core.algorithms.dqn.dqn.DQN.update", 
false]], "update() (in module arlbench.core.running_statistics)": [[35, "arlbench.core.running_statistics.update", false], [43, "arlbench.core.running_statistics.update", false]], "update_actor() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.update_actor", false], [44, "arlbench.core.algorithms.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.update_actor", false], [47, "arlbench.core.algorithms.sac.SAC.update_actor", false]], "update_actor() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false], [47, "arlbench.core.algorithms.sac.sac.SAC.update_actor", false]], "update_alpha() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.update_alpha", false], [44, "arlbench.core.algorithms.SAC.update_alpha", false]], "update_alpha() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.update_alpha", false], [47, "arlbench.core.algorithms.sac.SAC.update_alpha", false]], "update_alpha() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false], [47, "arlbench.core.algorithms.sac.sac.SAC.update_alpha", false]], "update_critic() (arlbench.core.algorithms.sac method)": [[13, "arlbench.core.algorithms.SAC.update_critic", false], [44, "arlbench.core.algorithms.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac method)": [[24, "arlbench.core.algorithms.sac.SAC.update_critic", false], [47, "arlbench.core.algorithms.sac.SAC.update_critic", false]], "update_critic() (arlbench.core.algorithms.sac.sac.sac method)": [[26, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false], [47, "arlbench.core.algorithms.sac.sac.SAC.update_critic", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm method)": [[13, "arlbench.core.algorithms.Algorithm.update_hpo_config", false], 
[44, "arlbench.core.algorithms.Algorithm.update_hpo_config", false]], "update_hpo_config() (arlbench.core.algorithms.algorithm.algorithm method)": [[14, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false], [44, "arlbench.core.algorithms.algorithm.Algorithm.update_hpo_config", false]], "value (arlbench.core.algorithms.ppo.ppo.transition attribute)": [[22, "arlbench.core.algorithms.ppo.ppo.Transition.value", false], [46, "arlbench.core.algorithms.ppo.ppo.Transition.value", false]], "value (arlbench.core.algorithms.sac.sac.transition attribute)": [[26, "arlbench.core.algorithms.sac.sac.Transition.value", false], [47, "arlbench.core.algorithms.sac.sac.Transition.value", false]], "values() (arlbench.core.algorithms.common.timestep method)": [[16, "arlbench.core.algorithms.common.TimeStep.values", false], [44, "arlbench.core.algorithms.common.TimeStep.values", false]], "wrapper (class in arlbench.core.wrappers)": [[36, "arlbench.core.wrappers.Wrapper", false], [49, "arlbench.core.wrappers.Wrapper", false]], "wrapper (class in arlbench.core.wrappers.wrapper)": [[38, "arlbench.core.wrappers.wrapper.Wrapper", false], [49, "arlbench.core.wrappers.wrapper.Wrapper", false]], "xlandenv (class in arlbench.core.environments.xland_env)": [[34, "arlbench.core.environments.xland_env.XLandEnv", false], [48, "arlbench.core.environments.xland_env.XLandEnv", false]]}, "objects": {"": [[41, 0, 0, "-", "arlbench"]], "arlbench": [[41, 1, 1, "", "AutoRLEnv"], [41, 0, 0, "-", "arlbench"], [42, 0, 0, "-", "autorl"], [43, 0, 0, "-", "core"], [41, 5, 1, "", "run_arlbench"], [50, 0, 0, "-", "utils"]], "arlbench.AutoRLEnv": [[41, 2, 1, "", "ALGORITHMS"], [41, 3, 1, "", "action_space"], [41, 3, 1, "", "checkpoints"], [41, 3, 1, "", "config"], [41, 3, 1, "", "config_space"], [41, 4, 1, "", "eval"], [41, 3, 1, "", "hpo_config"], [41, 3, 1, "", "objectives"], [41, 3, 1, "", "observation_space"], [41, 4, 1, "", "reset"], [41, 4, 1, "", "step"]], "arlbench.arlbench": [[41, 5, 1, 
"", "run_arlbench"]], "arlbench.autorl": [[42, 1, 1, "", "AutoRLEnv"], [42, 0, 0, "-", "autorl_env"], [42, 0, 0, "-", "checkpointing"], [42, 0, 0, "-", "objectives"], [42, 0, 0, "-", "state_features"]], "arlbench.autorl.AutoRLEnv": [[42, 2, 1, "", "ALGORITHMS"], [42, 3, 1, "", "action_space"], [42, 3, 1, "", "checkpoints"], [42, 3, 1, "", "config"], [42, 3, 1, "", "config_space"], [42, 4, 1, "", "eval"], [42, 3, 1, "", "hpo_config"], [42, 3, 1, "", "objectives"], [42, 3, 1, "", "observation_space"], [42, 4, 1, "", "reset"], [42, 4, 1, "", "step"]], "arlbench.autorl.autorl_env": [[42, 1, 1, "", "AutoRLEnv"]], "arlbench.autorl.autorl_env.AutoRLEnv": [[42, 2, 1, "", "ALGORITHMS"], [42, 3, 1, "", "action_space"], [42, 3, 1, "", "checkpoints"], [42, 3, 1, "", "config"], [42, 3, 1, "", "config_space"], [42, 4, 1, "", "eval"], [42, 3, 1, "", "hpo_config"], [42, 3, 1, "", "objectives"], [42, 3, 1, "", "observation_space"], [42, 4, 1, "", "reset"], [42, 4, 1, "", "step"]], "arlbench.autorl.checkpointing": [[42, 1, 1, "", "Checkpointer"]], "arlbench.autorl.checkpointing.Checkpointer": [[42, 2, 1, "", "MRP_FILE"], [42, 2, 1, "", "NODES_FILE"], [42, 2, 1, "", "SCALARS_FILE"], [42, 4, 1, "", "load"], [42, 4, 1, "", "load_buffer"], [42, 4, 1, "", "save"], [42, 4, 1, "", "save_buffer"]], "arlbench.autorl.objectives": [[42, 1, 1, "", "Emissions"], [42, 1, 1, "", "Objective"], [42, 1, 1, "", "RewardMean"], [42, 1, 1, "", "RewardStd"], [42, 1, 1, "", "Runtime"]], "arlbench.autorl.objectives.Emissions": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Objective": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "__lt__"], [42, 4, 1, "", "__new__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardMean": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.RewardStd": 
[[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.objectives.Runtime": [[42, 2, 1, "", "KEY"], [42, 2, 1, "", "RANK"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_spec"]], "arlbench.autorl.state_features": [[42, 1, 1, "", "GradInfo"], [42, 1, 1, "", "StateFeature"]], "arlbench.autorl.state_features.GradInfo": [[42, 2, 1, "", "KEY"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "get_state_space"]], "arlbench.autorl.state_features.StateFeature": [[42, 2, 1, "", "KEY"], [42, 4, 1, "", "__call__"], [42, 4, 1, "", "__new__"], [42, 4, 1, "", "get_state_space"]], "arlbench.core": [[44, 0, 0, "-", "algorithms"], [48, 0, 0, "-", "environments"], [43, 0, 0, "-", "running_statistics"], [49, 0, 0, "-", "wrappers"]], "arlbench.core.algorithms": [[44, 1, 1, "", "Algorithm"], [44, 1, 1, "", "DQN"], [44, 1, 1, "", "PPO"], [44, 1, 1, "", "SAC"], [44, 0, 0, "-", "algorithm"], [44, 0, 0, "-", "buffers"], [44, 0, 0, "-", "common"], [45, 0, 0, "-", "dqn"], [46, 0, 0, "-", "ppo"], [44, 0, 0, "-", "prioritised_item_buffer"], [47, 0, 0, "-", "sac"]], "arlbench.core.algorithms.Algorithm": [[44, 3, 1, "", "action_type"], [44, 4, 1, "", "eval"], [44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.DQN": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", 
"update"]], "arlbench.core.algorithms.PPO": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"]], "arlbench.core.algorithms.SAC": [[44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_actor"], [44, 4, 1, "", "update_alpha"], [44, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.algorithm": [[44, 1, 1, "", "Algorithm"]], "arlbench.core.algorithms.algorithm.Algorithm": [[44, 3, 1, "", "action_type"], [44, 4, 1, "", "eval"], [44, 4, 1, "", "get_checkpoint_factory"], [44, 4, 1, "", "get_default_hpo_config"], [44, 4, 1, "", "get_default_nas_config"], [44, 4, 1, "", "get_hpo_config_space"], [44, 4, 1, "", "get_hpo_search_space"], [44, 4, 1, "", "get_nas_config_space"], [44, 4, 1, "", "init"], [44, 2, 1, "", "name"], [44, 4, 1, "", "predict"], [44, 4, 1, "", "train"], [44, 4, 1, "", "update_hpo_config"]], "arlbench.core.algorithms.buffers": [[44, 5, 1, "", "uniform_sample"]], "arlbench.core.algorithms.common": [[44, 1, 1, "", "TimeStep"]], "arlbench.core.algorithms.common.TimeStep": [[44, 2, 1, "", "action"], [44, 2, 1, "", "done"], [44, 4, 1, "", "from_tuple"], [44, 4, 1, "", "items"], [44, 4, 1, "", "keys"], [44, 2, 1, "", "last_obs"], [44, 2, 1, "", "obs"], [44, 4, 1, "", "replace"], [44, 2, 1, "", "reward"], [44, 4, 1, "", "to_tuple"], [44, 4, 1, "", "values"]], "arlbench.core.algorithms.dqn": [[45, 1, 1, "", "DQN"], [45, 1, 1, "", "DQNMetrics"], [45, 1, 1, "", 
"DQNRunnerState"], [45, 1, 1, "", "DQNState"], [45, 2, 1, "", "DQNTrainReturnT"], [45, 1, 1, "", "DQNTrainingResult"], [45, 0, 0, "-", "dqn"], [45, 0, 0, "-", "models"]], "arlbench.core.algorithms.dqn.DQN": [[45, 4, 1, "", "get_checkpoint_factory"], [45, 4, 1, "", "get_default_hpo_config"], [45, 4, 1, "", "get_default_nas_config"], [45, 4, 1, "", "get_hpo_config_space"], [45, 4, 1, "", "get_hpo_search_space"], [45, 4, 1, "", "get_nas_config_space"], [45, 4, 1, "", "init"], [45, 2, 1, "", "name"], [45, 4, 1, "", "predict"], [45, 4, 1, "", "train"], [45, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.DQNMetrics": [[45, 2, 1, "", "grads"], [45, 2, 1, "", "loss"], [45, 2, 1, "", "td_error"]], "arlbench.core.algorithms.dqn.DQNRunnerState": [[45, 2, 1, "", "env_state"], [45, 2, 1, "", "global_step"], [45, 2, 1, "", "normalizer_state"], [45, 2, 1, "", "obs"], [45, 2, 1, "", "rng"], [45, 2, 1, "", "train_state"]], "arlbench.core.algorithms.dqn.DQNState": [[45, 2, 1, "", "buffer_state"], [45, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.DQNTrainingResult": [[45, 2, 1, "", "eval_rewards"], [45, 2, 1, "", "metrics"], [45, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn": [[45, 1, 1, "", "DQN"], [45, 1, 1, "", "DQNMetrics"], [45, 1, 1, "", "DQNRunnerState"], [45, 1, 1, "", "DQNState"], [45, 1, 1, "", "DQNTrainState"], [45, 1, 1, "", "DQNTrainingResult"], [45, 1, 1, "", "Transition"]], "arlbench.core.algorithms.dqn.dqn.DQN": [[45, 4, 1, "", "get_checkpoint_factory"], [45, 4, 1, "", "get_default_hpo_config"], [45, 4, 1, "", "get_default_nas_config"], [45, 4, 1, "", "get_hpo_config_space"], [45, 4, 1, "", "get_hpo_search_space"], [45, 4, 1, "", "get_nas_config_space"], [45, 4, 1, "", "init"], [45, 2, 1, "", "name"], [45, 4, 1, "", "predict"], [45, 4, 1, "", "train"], [45, 4, 1, "", "update"]], "arlbench.core.algorithms.dqn.dqn.DQNMetrics": [[45, 2, 1, "", "grads"], [45, 2, 1, "", "loss"], [45, 2, 1, "", "td_error"]], 
"arlbench.core.algorithms.dqn.dqn.DQNRunnerState": [[45, 2, 1, "", "env_state"], [45, 2, 1, "", "global_step"], [45, 2, 1, "", "normalizer_state"], [45, 2, 1, "", "obs"], [45, 2, 1, "", "rng"], [45, 2, 1, "", "train_state"]], "arlbench.core.algorithms.dqn.dqn.DQNState": [[45, 2, 1, "", "buffer_state"], [45, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainState": [[45, 4, 1, "", "create_with_opt_state"], [45, 2, 1, "", "opt_state"], [45, 4, 1, "", "replace"], [45, 2, 1, "", "target_params"]], "arlbench.core.algorithms.dqn.dqn.DQNTrainingResult": [[45, 2, 1, "", "eval_rewards"], [45, 2, 1, "", "metrics"], [45, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.dqn.dqn.Transition": [[45, 2, 1, "", "action"], [45, 2, 1, "", "done"], [45, 2, 1, "", "info"], [45, 2, 1, "", "obs"], [45, 2, 1, "", "reward"]], "arlbench.core.algorithms.dqn.models": [[45, 1, 1, "", "CNNQ"], [45, 1, 1, "", "MLPQ"]], "arlbench.core.algorithms.dqn.models.CNNQ": [[45, 4, 1, "", "__call__"], [45, 2, 1, "", "action_dim"], [45, 2, 1, "", "activation"], [45, 2, 1, "", "discrete"], [45, 2, 1, "", "hidden_size"], [45, 2, 1, "", "name"], [45, 2, 1, "", "parent"], [45, 2, 1, "", "scope"], [45, 4, 1, "", "setup"]], "arlbench.core.algorithms.dqn.models.MLPQ": [[45, 4, 1, "", "__call__"], [45, 2, 1, "", "action_dim"], [45, 2, 1, "", "activation"], [45, 2, 1, "", "discrete"], [45, 2, 1, "", "hidden_size"], [45, 2, 1, "", "name"], [45, 2, 1, "", "parent"], [45, 2, 1, "", "scope"], [45, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo": [[46, 1, 1, "", "PPO"], [46, 1, 1, "", "PPOMetrics"], [46, 1, 1, "", "PPORunnerState"], [46, 1, 1, "", "PPOState"], [46, 2, 1, "", "PPOTrainReturnT"], [46, 1, 1, "", "PPOTrainingResult"], [46, 0, 0, "-", "models"], [46, 0, 0, "-", "ppo"]], "arlbench.core.algorithms.ppo.PPO": [[46, 4, 1, "", "get_checkpoint_factory"], [46, 4, 1, "", "get_default_hpo_config"], [46, 4, 1, "", "get_default_nas_config"], [46, 4, 1, "", "get_hpo_config_space"], [46, 4, 1, 
"", "get_hpo_search_space"], [46, 4, 1, "", "get_nas_config_space"], [46, 4, 1, "", "init"], [46, 2, 1, "", "name"], [46, 4, 1, "", "predict"], [46, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.PPOMetrics": [[46, 2, 1, "", "advantages"], [46, 2, 1, "", "grads"], [46, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.PPORunnerState": [[46, 2, 1, "", "cur_rewards"], [46, 2, 1, "", "env_state"], [46, 2, 1, "", "global_step"], [46, 2, 1, "", "normalizer_state"], [46, 2, 1, "", "obs"], [46, 2, 1, "", "return_buffer"], [46, 2, 1, "", "return_buffer_idx"], [46, 2, 1, "", "rng"], [46, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.PPOState": [[46, 2, 1, "", "buffer_state"], [46, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.PPOTrainingResult": [[46, 2, 1, "", "eval_rewards"], [46, 2, 1, "", "metrics"], [46, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.models": [[46, 1, 1, "", "CNNActorCritic"], [46, 1, 1, "", "MLPActorCritic"]], "arlbench.core.algorithms.ppo.models.CNNActorCritic": [[46, 4, 1, "", "__call__"], [46, 2, 1, "", "action_dim"], [46, 2, 1, "", "activation"], [46, 2, 1, "", "discrete"], [46, 2, 1, "", "hidden_size"], [46, 2, 1, "", "name"], [46, 2, 1, "", "parent"], [46, 2, 1, "", "scope"], [46, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.models.MLPActorCritic": [[46, 4, 1, "", "__call__"], [46, 2, 1, "", "action_dim"], [46, 2, 1, "", "activation"], [46, 2, 1, "", "discrete"], [46, 2, 1, "", "hidden_size"], [46, 2, 1, "", "name"], [46, 2, 1, "", "parent"], [46, 2, 1, "", "scope"], [46, 4, 1, "", "setup"]], "arlbench.core.algorithms.ppo.ppo": [[46, 1, 1, "", "PPO"], [46, 1, 1, "", "PPOMetrics"], [46, 1, 1, "", "PPORunnerState"], [46, 1, 1, "", "PPOState"], [46, 1, 1, "", "PPOTrainState"], [46, 1, 1, "", "PPOTrainingResult"], [46, 1, 1, "", "Transition"]], "arlbench.core.algorithms.ppo.ppo.PPO": [[46, 4, 1, "", "get_checkpoint_factory"], [46, 4, 1, "", "get_default_hpo_config"], [46, 4, 1, "", 
"get_default_nas_config"], [46, 4, 1, "", "get_hpo_config_space"], [46, 4, 1, "", "get_hpo_search_space"], [46, 4, 1, "", "get_nas_config_space"], [46, 4, 1, "", "init"], [46, 2, 1, "", "name"], [46, 4, 1, "", "predict"], [46, 4, 1, "", "train"]], "arlbench.core.algorithms.ppo.ppo.PPOMetrics": [[46, 2, 1, "", "advantages"], [46, 2, 1, "", "grads"], [46, 2, 1, "", "loss"]], "arlbench.core.algorithms.ppo.ppo.PPORunnerState": [[46, 2, 1, "", "cur_rewards"], [46, 2, 1, "", "env_state"], [46, 2, 1, "", "global_step"], [46, 2, 1, "", "normalizer_state"], [46, 2, 1, "", "obs"], [46, 2, 1, "", "return_buffer"], [46, 2, 1, "", "return_buffer_idx"], [46, 2, 1, "", "rng"], [46, 2, 1, "", "train_state"]], "arlbench.core.algorithms.ppo.ppo.PPOState": [[46, 2, 1, "", "buffer_state"], [46, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainState": [[46, 4, 1, "", "create_with_opt_state"], [46, 2, 1, "", "opt_state"], [46, 4, 1, "", "replace"]], "arlbench.core.algorithms.ppo.ppo.PPOTrainingResult": [[46, 2, 1, "", "eval_rewards"], [46, 2, 1, "", "metrics"], [46, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.ppo.ppo.Transition": [[46, 2, 1, "", "action"], [46, 2, 1, "", "done"], [46, 2, 1, "", "info"], [46, 2, 1, "", "log_prob"], [46, 2, 1, "", "obs"], [46, 2, 1, "", "reward"], [46, 2, 1, "", "value"]], "arlbench.core.algorithms.prioritised_item_buffer": [[44, 5, 1, "", "create_prioritised_item_buffer"], [44, 5, 1, "", "make_prioritised_item_buffer"]], "arlbench.core.algorithms.sac": [[47, 1, 1, "", "SAC"], [47, 1, 1, "", "SACMetrics"], [47, 1, 1, "", "SACRunnerState"], [47, 1, 1, "", "SACState"], [47, 2, 1, "", "SACTrainReturnT"], [47, 1, 1, "", "SACTrainingResult"], [47, 0, 0, "-", "models"], [47, 0, 0, "-", "sac"]], "arlbench.core.algorithms.sac.SAC": [[47, 4, 1, "", "get_checkpoint_factory"], [47, 4, 1, "", "get_default_hpo_config"], [47, 4, 1, "", "get_default_nas_config"], [47, 4, 1, "", "get_hpo_config_space"], [47, 4, 1, "", 
"get_hpo_search_space"], [47, 4, 1, "", "get_nas_config_space"], [47, 4, 1, "", "init"], [47, 2, 1, "", "name"], [47, 4, 1, "", "predict"], [47, 4, 1, "", "train"], [47, 4, 1, "", "update_actor"], [47, 4, 1, "", "update_alpha"], [47, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.SACMetrics": [[47, 2, 1, "", "actor_grads"], [47, 2, 1, "", "actor_loss"], [47, 2, 1, "", "alpha_loss"], [47, 2, 1, "", "critic_grads"], [47, 2, 1, "", "critic_loss"], [47, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.SACRunnerState": [[47, 2, 1, "", "actor_train_state"], [47, 2, 1, "", "alpha_train_state"], [47, 2, 1, "", "critic_train_state"], [47, 2, 1, "", "env_state"], [47, 2, 1, "", "global_step"], [47, 2, 1, "", "normalizer_state"], [47, 2, 1, "", "obs"], [47, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.SACState": [[47, 2, 1, "", "buffer_state"], [47, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.SACTrainingResult": [[47, 2, 1, "", "eval_rewards"], [47, 2, 1, "", "metrics"], [47, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.models": [[47, 1, 1, "", "AlphaCoef"], [47, 1, 1, "", "SACCNNActor"], [47, 1, 1, "", "SACCNNCritic"], [47, 1, 1, "", "SACMLPActor"], [47, 1, 1, "", "SACMLPCritic"], [47, 1, 1, "", "SACVectorCritic"], [47, 1, 1, "", "TanhTransformedDistribution"]], "arlbench.core.algorithms.sac.models.AlphaCoef": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "alpha_init"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNActor": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "log_std_max"], [47, 2, 1, "", "log_std_min"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACCNNCritic": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", 
"activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPActor": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "log_std_max"], [47, 2, 1, "", "log_std_min"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACMLPCritic": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"], [47, 4, 1, "", "setup"]], "arlbench.core.algorithms.sac.models.SACVectorCritic": [[47, 4, 1, "", "__call__"], [47, 2, 1, "", "action_dim"], [47, 2, 1, "", "activation"], [47, 2, 1, "", "critic"], [47, 2, 1, "", "hidden_size"], [47, 2, 1, "", "n_critics"], [47, 2, 1, "", "name"], [47, 2, 1, "", "parent"], [47, 2, 1, "", "scope"]], "arlbench.core.algorithms.sac.models.TanhTransformedDistribution": [[47, 4, 1, "", "mode"]], "arlbench.core.algorithms.sac.sac": [[47, 1, 1, "", "SAC"], [47, 1, 1, "", "SACMetrics"], [47, 1, 1, "", "SACRunnerState"], [47, 1, 1, "", "SACState"], [47, 1, 1, "", "SACTrainState"], [47, 1, 1, "", "SACTrainingResult"], [47, 1, 1, "", "Transition"]], "arlbench.core.algorithms.sac.sac.SAC": [[47, 4, 1, "", "get_checkpoint_factory"], [47, 4, 1, "", "get_default_hpo_config"], [47, 4, 1, "", "get_default_nas_config"], [47, 4, 1, "", "get_hpo_config_space"], [47, 4, 1, "", "get_hpo_search_space"], [47, 4, 1, "", "get_nas_config_space"], [47, 4, 1, "", "init"], [47, 2, 1, "", "name"], [47, 4, 1, "", "predict"], [47, 4, 1, "", "train"], [47, 4, 1, "", "update_actor"], [47, 4, 1, "", "update_alpha"], [47, 4, 1, "", "update_critic"]], "arlbench.core.algorithms.sac.sac.SACMetrics": [[47, 2, 1, "", "actor_grads"], [47, 2, 1, "", "actor_loss"], 
[47, 2, 1, "", "alpha_loss"], [47, 2, 1, "", "critic_grads"], [47, 2, 1, "", "critic_loss"], [47, 2, 1, "", "td_error"]], "arlbench.core.algorithms.sac.sac.SACRunnerState": [[47, 2, 1, "", "actor_train_state"], [47, 2, 1, "", "alpha_train_state"], [47, 2, 1, "", "critic_train_state"], [47, 2, 1, "", "env_state"], [47, 2, 1, "", "global_step"], [47, 2, 1, "", "normalizer_state"], [47, 2, 1, "", "obs"], [47, 2, 1, "", "rng"]], "arlbench.core.algorithms.sac.sac.SACState": [[47, 2, 1, "", "buffer_state"], [47, 2, 1, "", "runner_state"]], "arlbench.core.algorithms.sac.sac.SACTrainState": [[47, 4, 1, "", "create_with_opt_state"], [47, 2, 1, "", "network_state"], [47, 4, 1, "", "replace"], [47, 2, 1, "", "target_params"]], "arlbench.core.algorithms.sac.sac.SACTrainingResult": [[47, 2, 1, "", "eval_rewards"], [47, 2, 1, "", "metrics"], [47, 2, 1, "", "trajectories"]], "arlbench.core.algorithms.sac.sac.Transition": [[47, 2, 1, "", "action"], [47, 2, 1, "", "done"], [47, 2, 1, "", "info"], [47, 2, 1, "", "obs"], [47, 2, 1, "", "reward"], [47, 2, 1, "", "value"]], "arlbench.core.environments": [[48, 1, 1, "", "BraxEnv"], [48, 1, 1, "", "Environment"], [48, 1, 1, "", "EnvpoolEnv"], [48, 1, 1, "", "GymnasiumEnv"], [48, 1, 1, "", "GymnaxEnv"], [48, 0, 0, "-", "autorl_env"], [48, 0, 0, "-", "brax_env"], [48, 0, 0, "-", "envpool_env"], [48, 0, 0, "-", "gymnasium_env"], [48, 0, 0, "-", "gymnax_env"], [48, 5, 1, "", "make_env"], [48, 0, 0, "-", "make_env"], [48, 0, 0, "-", "xland_env"]], "arlbench.core.environments.BraxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.Environment": [[48, 4, 1, "", "action_space"], [48, 3, 1, "", "env_name"], [48, 3, 1, "", "n_envs"], [48, 4, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_actions"], [48, 4, 1, "", "step"]], "arlbench.core.environments.EnvpoolEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", 
"observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.GymnasiumEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.GymnaxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_action"], [48, 4, 1, "", "step"]], "arlbench.core.environments.autorl_env": [[48, 1, 1, "", "Environment"]], "arlbench.core.environments.autorl_env.Environment": [[48, 4, 1, "", "action_space"], [48, 3, 1, "", "env_name"], [48, 3, 1, "", "n_envs"], [48, 4, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_actions"], [48, 4, 1, "", "step"]], "arlbench.core.environments.brax_env": [[48, 1, 1, "", "BraxEnv"]], "arlbench.core.environments.brax_env.BraxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.envpool_env": [[48, 1, 1, "", "EnvpoolEnv"], [48, 5, 1, "", "numpy_to_jax"]], "arlbench.core.environments.envpool_env.EnvpoolEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.gymnasium_env": [[48, 1, 1, "", "GymnasiumEnv"]], "arlbench.core.environments.gymnasium_env.GymnasiumEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "step"]], "arlbench.core.environments.gymnax_env": [[48, 1, 1, "", "GymnaxEnv"]], "arlbench.core.environments.gymnax_env.GymnaxEnv": [[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_action"], [48, 4, 1, "", "step"]], "arlbench.core.environments.make_env": [[48, 5, 1, "", "make_env"]], "arlbench.core.environments.xland_env": [[48, 1, 1, "", "XLandEnv"]], "arlbench.core.environments.xland_env.XLandEnv": 
[[48, 3, 1, "", "action_space"], [48, 3, 1, "", "observation_space"], [48, 4, 1, "", "reset"], [48, 4, 1, "", "sample_action"], [48, 4, 1, "", "step"]], "arlbench.core.running_statistics": [[43, 1, 1, "", "NestedMeanStd"], [43, 1, 1, "", "RunningStatisticsState"], [43, 5, 1, "", "denormalize"], [43, 5, 1, "", "init_state"], [43, 5, 1, "", "normalize"], [43, 5, 1, "", "update"]], "arlbench.core.running_statistics.NestedMeanStd": [[43, 2, 1, "", "mean"], [43, 4, 1, "", "replace"], [43, 2, 1, "", "std"]], "arlbench.core.running_statistics.RunningStatisticsState": [[43, 2, 1, "", "count"], [43, 4, 1, "", "replace"], [43, 2, 1, "", "summed_variance"]], "arlbench.core.wrappers": [[49, 1, 1, "", "FlattenObservationWrapper"], [49, 1, 1, "", "Wrapper"], [49, 0, 0, "-", "flatten_observation"], [49, 0, 0, "-", "wrapper"]], "arlbench.core.wrappers.FlattenObservationWrapper": [[49, 3, 1, "", "observation_space"], [49, 4, 1, "", "reset"], [49, 4, 1, "", "step"]], "arlbench.core.wrappers.flatten_observation": [[49, 1, 1, "", "FlattenObservationWrapper"]], "arlbench.core.wrappers.flatten_observation.FlattenObservationWrapper": [[49, 3, 1, "", "observation_space"], [49, 4, 1, "", "reset"], [49, 4, 1, "", "step"]], "arlbench.core.wrappers.wrapper": [[49, 1, 1, "", "Wrapper"]], "arlbench.utils": [[50, 0, 0, "-", "common"], [50, 5, 1, "", "config_space_to_gymnasium_space"], [50, 5, 1, "", "config_space_to_yaml"], [50, 5, 1, "", "gymnasium_space_to_gymnax_space"], [50, 5, 1, "", "recursive_concat"], [50, 5, 1, "", "save_defaults_to_yaml"], [50, 5, 1, "", "tuple_concat"]], "arlbench.utils.common": [[50, 5, 1, "", "config_space_to_gymnasium_space"], [50, 5, 1, "", "config_space_to_yaml"], [50, 5, 1, "", "gymnasium_space_to_gymnax_space"], [50, 5, 1, "", "recursive_concat"], [50, 5, 1, "", "save_defaults_to_yaml"], [50, 5, 1, "", "tuple_concat"]]}, "objnames": {"0": ["py", "module", "Python module"], "1": ["py", "class", "Python class"], "2": ["py", "attribute", "Python attribute"], "3": 
["py", "property", "Python property"], "4": ["py", "method", "Python method"], "5": ["py", "function", "Python function"]}, "objtypes": {"0": "py:module", "1": "py:class", "2": "py:attribute", "3": "py:property", "4": "py:method", "5": "py:function"}, "terms": {"": [5, 6, 13, 14, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 41, 44, 45, 46, 47, 52, 54], "0": [17, 18, 20, 22, 23, 24, 25, 26, 27, 33, 35, 39, 40, 42, 43, 44, 45, 46, 47, 48, 50], "06": [35, 43], "1": [17, 18, 20, 22, 24, 25, 26, 27, 33, 42, 45, 46, 47, 48, 54, 60], "10": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 60], "100": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "1000000": [13, 14, 17, 18, 20, 22, 24, 26, 35, 43, 44, 45, 46, 47], "1e": [35, 43], "2": [17, 18, 20, 22, 24, 25, 26, 35, 42, 43, 45, 46, 47, 60], "20": [25, 47, 51], "24": [35, 43], "3": [17, 18, 20, 22, 24, 26, 45, 46, 47, 60], "31": [35, 43], "4": [17, 18, 20, 22, 24, 26, 45, 46, 47], "5": [17, 18, 20, 22, 24, 26, 45, 46, 47], "512": [19, 21, 25, 45, 46, 47], "6": [20, 22, 23, 24, 26, 44, 46, 47], "64": [19, 21, 25, 45, 46, 47], "64bit": [35, 43], "7": [20, 22, 24, 26, 46, 47], "8": [20, 22, 46], "A": [16, 19, 21, 25, 27, 29, 31, 32, 34, 35, 43, 44, 45, 46, 47, 48, 54, 58], "As": [20, 22, 27, 28, 46, 48], "For": 51, "If": [5, 7, 8, 23, 35, 41, 42, 43, 44, 52, 60], "In": [0, 5, 7, 8, 41, 42, 52], "It": [10, 11, 42, 57], "Not": [13, 17, 18, 24, 26, 44, 45, 47], "The": [9, 13, 14, 19, 21, 23, 25, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 39, 40, 42, 43, 44, 45, 46, 47, 48, 49, 50, 52, 53, 54, 57, 58, 60], "Then": 60, "There": 60, "These": [27, 28, 48, 51, 53, 54], "To": [35, 43], "With": [5, 7, 8, 41, 42], "_": [13, 20, 22, 24, 26, 44, 46, 47, 48], "__call__": [10, 11, 19, 21, 25, 41, 42, 44, 45, 46, 47], "__init__": [19, 21, 25, 45, 46, 47], "__lt__": [10, 41, 42], "__new__": [10, 11, 41, 42], "__setattr__": [19, 21, 25, 45, 46, 47], "_description_": [5, 7, 8, 13, 24, 26, 27, 28, 33, 39, 40, 41, 42, 44, 47, 48, 50], "_imag": [35, 
43], "_sentinel": [19, 21, 25, 45, 46, 47], "_type_": [39, 40, 50], "abc": [10, 11, 13, 14, 27, 28, 42, 44, 48], "abstract": [10, 11, 13, 14, 27, 28, 42, 44, 48], "access": [19, 21, 25, 45, 46, 47], "accumul": [35, 43], "acm": [35, 43], "across": [20, 22, 46, 53], "act": [23, 44], "action": [5, 7, 8, 13, 14, 16, 17, 18, 20, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49], "action_dim": [19, 21, 25, 44, 45, 46, 47], "action_s": [13, 14, 44], "action_spac": [5, 7, 8, 27, 28, 29, 30, 31, 32, 34, 41, 42, 43, 48, 61], "action_typ": [13, 14, 43, 44], "activ": [19, 21, 25, 44, 45, 46, 47, 60], "actor": [13, 21, 24, 25, 26, 44, 46, 47, 58], "actor_grad": [24, 26, 44, 47], "actor_loss": [13, 24, 26, 44, 47], "actor_network_param": [13, 24, 26, 44, 47], "actor_opt_st": [13, 24, 26, 44, 47], "actor_train_st": [13, 24, 26, 44, 47], "actual": [27, 28, 48, 52, 57], "ad": [23, 44], "adapt": [13, 14, 15, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "add": [23, 44], "add_batch": [23, 44], "add_sequ": [23, 44], "addit": [0, 5, 7, 8, 41, 42, 54], "advantag": [10, 11, 20, 22, 42, 44, 46], "after": [35, 43], "agent": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 54], "algorithm": [0, 5, 7, 8, 9, 27, 28, 39, 40, 41, 42, 43, 48, 50, 51, 52, 54, 55, 58, 61], "algorithm_kw_arg": [9, 42], "algorithm_st": [9, 13, 14, 42, 44], "algorithmst": [9, 42], "alia": [17, 18, 20, 22, 24, 26, 45, 46, 47], "all": [9, 13, 14, 17, 18, 20, 22, 24, 26, 35, 42, 43, 44, 45, 46, 47, 52], "allow": [10, 11, 42, 51, 53], "alongsid": 52, "alpha": [13, 23, 24, 25, 26, 44, 47], "alpha_init": [25, 44, 47], "alpha_loss": [13, 24, 26, 44, 47], "alpha_network_param": [13, 24, 26, 44, 47], "alpha_opt_st": [13, 24, 26, 44, 47], "alpha_train_st": [13, 24, 26, 44, 47], "alphacoef": [25, 44, 47], "also": [0, 57], "alwai": [20, 22, 46, 57], "among": [13, 14, 44], "an": [9, 10, 11, 16, 19, 21, 23, 25, 27, 28, 30, 35, 42, 43, 44, 45, 46, 47, 48, 52, 58], "analyz": 51, 
"ani": [9, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 33, 35, 36, 37, 42, 43, 44, 45, 46, 47, 48, 49], "anoth": [19, 21, 25, 45, 46, 47], "append": [9, 42], "appli": [19, 21, 25, 45, 46, 47, 58], "apply_fn": [18, 22, 26, 45, 46, 47], "approxim": 58, "ar": [9, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 35, 36, 37, 42, 43, 44, 45, 46, 47, 49, 51, 53, 54, 57, 60], "architectur": [13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 44, 45, 46, 47, 50, 54], "arg": [10, 11, 25, 42, 47], "argument": [27, 33, 48, 54], "arlbench": [52, 57, 60], "arlbenchmark": 52, "around": [10, 11, 42], "arrai": [5, 7, 8, 17, 18, 20, 22, 24, 25, 26, 27, 28, 30, 35, 41, 42, 43, 44, 45, 46, 47, 48], "aspect": 52, "assign": [19, 21, 25, 45, 46, 47], "attribut": [9, 19, 21, 25, 42, 45, 46, 47], "autom": [5, 7, 8, 41, 42, 58], "automl": [58, 60], "autorl": [5, 41, 51, 53, 54, 55, 58, 61], "autorl_config": [9, 42], "autorl_env": [41, 43, 61], "autorlenv": [5, 7, 8, 41, 42, 61], "avail": [51, 53, 54], "axi": [35, 39, 40, 43, 50], "base": [5, 7, 8, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 46, 47, 48, 49], "baselines3": [21, 25, 46, 47], "basi": 52, "basic": [10, 11, 13, 14, 42, 44], "batch": [13, 15, 17, 18, 23, 24, 26, 35, 43, 44, 45, 47], "batch_siz": [15, 44], "bayesian": 58, "befor": [5, 7, 8, 19, 21, 25, 35, 41, 42, 43, 45, 46, 47], "behavior": [51, 54], "behaviour": [10, 11, 42], "being": [19, 21, 23, 25, 44, 45, 46, 47], "benchmark": [51, 54], "best": [52, 58, 60], "between": [10, 15, 42, 44], "black": [52, 58], "blob": [21, 25, 35, 43, 46, 47], "bo": 58, "bool": [5, 7, 8, 9, 10, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 35, 41, 42, 43, 44, 45, 46, 47, 48], "bool_": [20, 22, 24, 26, 44, 46, 47, 48], "both": [27, 28, 48, 55], "bound": [19, 21, 25, 45, 46, 47], "box": [36, 37, 49, 52, 58], "branch": 57, "brax": [27, 29, 33, 48, 54], "brax_env": [41, 43], "braxenv": [27, 29, 43, 48], "buffer": [9, 13, 14, 17, 
18, 20, 22, 23, 41, 42, 43, 45, 46], "buffer_dir": [9, 42], "buffer_st": [9, 13, 14, 17, 18, 20, 22, 24, 26, 42, 44, 45, 46, 47], "c_episod": [9, 42], "c_step": [9, 42], "calcul": [10, 11, 25, 42, 47], "call": [5, 7, 8, 10, 11, 19, 21, 23, 25, 36, 37, 41, 42, 44, 45, 46, 47, 49], "callabl": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "can": [10, 11, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 42, 44, 45, 46, 47, 52, 54, 57, 58, 60], "captur": [16, 44], "carbon": [10, 42], "case": [19, 21, 25, 45, 46, 47, 52], "caus": [19, 21, 25, 45, 46, 47], "caution": 57, "cd": 60, "certain": [9, 42], "cfg": [5, 6, 41], "checkpoint": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 44, 45, 46, 47, 54, 61], "checkpoint_dir": [9, 42, 54], "checkpoint_nam": [9, 42, 54], "checkpoint_path": [5, 7, 8, 9, 41, 42], "chex": [13, 14, 15, 17, 18, 20, 22, 24, 26, 36, 37, 44, 45, 46, 47, 49], "choos": 52, "chosen": [23, 44], "cl": [10, 11, 42], "class": [5, 7, 8, 9, 10, 11, 13, 14, 16, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 41, 42, 43, 44, 45, 46, 47, 48, 49], "classmethod": [45, 46, 47], "clear": 57, "clearli": 57, "clip": 58, "clone": 60, "cnn": [19, 21, 25, 45, 46, 47, 54], "cnn_polici": [13, 17, 18, 20, 22, 24, 26, 27, 33, 34, 44, 45, 46, 47, 48, 54], "cnnactorcrit": [21, 44, 46], "cnnq": [19, 44, 45], "co2": 53, "code": [10, 42, 57], "coeffici": [25, 47], "com": [21, 25, 35, 43, 46, 47, 60], "command": 60, "common": [9, 21, 25, 41, 42, 43, 46, 47, 61], "common_gotchas_in_jax": [35, 43], "compact": [19, 21, 25, 45, 46, 47], "compar": [10, 42], "comparison": [10, 42, 57], "compat": [27, 33, 48], "comput": [35, 43], "concat": [39, 40, 50], "concaten": [39, 40, 50], "conda": 60, "config": [5, 6, 7, 8, 41, 42, 61], "config_kei": [39, 40, 50], "config_spac": [5, 7, 8, 39, 40, 41, 42, 50, 61], "config_space_to_gymnasium_spac": [39, 40, 41, 50], "config_space_to_yaml": [39, 40, 41, 50], "configspac": [5, 7, 8, 39, 40, 41, 42, 50], "configur": [5, 7, 8, 
9, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 41, 42, 44, 45, 46, 47, 50, 52, 53, 54], "configurationspac": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 41, 42, 44, 45, 46, 47, 50], "consid": [35, 43], "consist": [17, 18, 20, 22, 24, 26, 45, 46, 47], "construct": [3, 19, 21, 25, 45, 46, 47], "contain": [9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 35, 42, 43, 44, 45, 46, 47, 48, 54], "content": 61, "conv": [19, 21, 25, 45, 46, 47], "conv1": [19, 21, 25, 45, 46, 47], "converst": [39, 40, 50], "convert": [30, 39, 40, 48, 50], "core": [41, 42, 61], "correctli": 57, "correspond": [35, 43], "count": [35, 41, 43], "cover": 51, "cpu": [23, 44], "creat": [5, 7, 8, 10, 11, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 41, 42, 44, 45, 46, 47, 48, 60], "create_prioritised_item_buff": [23, 43, 44], "create_with_opt_st": [44, 45, 46, 47], "critic": [13, 21, 24, 25, 26, 44, 46, 47, 58], "critic_grad": [24, 26, 44, 47], "critic_loss": [13, 24, 26, 44, 47], "critic_network_param": [13, 24, 26, 44, 47], "critic_opt_st": [13, 24, 26, 44, 47], "critic_target_param": [13, 24, 26, 44, 47], "critic_train_st": [13, 24, 26, 44, 47], "cumul": [13, 14, 44], "cur_reward": [20, 22, 44, 46], "current": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 52, 54], "d": [16, 44, 53], "data": [9, 23, 35, 42, 43, 44, 51], "decid": [52, 54], "deep": [13, 17, 18, 44, 45, 58], "deepmind": [35, 43], "def": [19, 21, 25, 45, 46, 47], "default": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 35, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50], "defin": [13, 14, 19, 21, 25, 44, 45, 46, 47, 52, 57], "degrad": [35, 43], "denorm": [35, 41, 43], "depend": [23, 35, 43, 44], "determinist": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 54], "deterministic_ev": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 54], "deviat": [10, 35, 42, 43, 52, 53], "devic": [23, 44], "diabl": 54, "dict": [5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 27, 33, 36, 37, 39, 40, 41, 42, 44, 45, 
46, 47, 48, 49, 50], "dict1": [39, 40, 50], "dict2": [39, 40, 50], "dictionari": [9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 42, 44, 45, 46, 47, 50], "differ": [0, 13, 14, 44, 52, 57, 58], "dimens": [35, 43], "directli": [10, 11, 42], "directori": [9, 42, 54], "discret": [13, 14, 19, 21, 44, 45, 46], "discuss": 52, "disk": [9, 42], "distrax": [25, 47], "distribut": [25, 47], "dlr": [21, 25, 46, 47], "do": [10, 11, 42, 57], "doc": [35, 43], "document": 52, "doe": [19, 20, 21, 22, 25, 45, 46, 47], "doesn": [35, 43], "dolor": 59, "done": [9, 10, 11, 13, 16, 17, 18, 22, 26, 42, 43, 44, 45, 46, 47, 51, 58, 60], "doubl": [35, 43], "download": 60, "dqn": [13, 24, 26, 41, 42, 43, 44, 47, 51, 52, 54, 58], "dqnmetric": [17, 18, 44, 45], "dqnrunnerst": [13, 17, 18, 44, 45], "dqnstate": [13, 17, 18, 44, 45], "dqntrainingresult": [13, 17, 18, 44, 45], "dqntrainreturnt": [13, 17, 18, 44, 45], "dqntrainstat": [13, 17, 18, 44, 45], "dtype": [35, 43], "dummi": [9, 42], "dummy_buffer_st": [9, 42], "dure": [5, 7, 8, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "dynam": [35, 43], "e": 53, "each": [5, 7, 8, 23, 27, 28, 41, 42, 44, 48, 54], "earlier": [35, 43], "effici": 51, "either": [19, 21, 25, 45, 46, 47, 60], "element": [35, 39, 40, 43, 50, 54], "emiss": [10, 41, 42, 53, 54], "empti": [5, 7, 8, 41, 42], "en": [35, 43], "enabl": [35, 43, 57], "ensur": 51, "entropi": [13, 24, 26, 44, 47, 58], "env": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 38, 41, 42, 44, 45, 46, 47, 48, 49], "env_framework": [27, 33, 48, 54], "env_kwarg": [27, 29, 30, 31, 32, 33, 34, 48, 54], "env_nam": [27, 28, 29, 30, 31, 32, 33, 34, 43, 48, 54], "env_stat": [17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49], "environ": [5, 7, 8, 9, 10, 11, 13, 14, 16, 36, 37, 41, 42, 43, 44, 49, 51, 52, 53, 54, 57, 58, 60], "envpool": [27, 30, 33, 48, 54, 60], "envpool_env": [41, 43], "envpoolenv": [27, 30, 43, 48], "episod": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 
41, 42, 44, 45, 46, 47, 53, 54], "equival": [23, 27, 33, 35, 43, 44, 48], "error": [5, 7, 8, 41, 42], "etc": [27, 33, 35, 43, 48], "eval": [5, 7, 8, 13, 14, 41, 42, 43, 44, 61], "eval_env": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "eval_env_kwarg": 54, "eval_reward": [17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "evalu": [5, 7, 8, 10, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 52, 53, 54], "evalut": [5, 7, 8, 41, 42], "even": [35, 43], "exact": 51, "exisit": 57, "experi": [13, 15, 24, 26, 44, 47, 51, 52, 57], "exploit": 58, "explor": [54, 58], "expon": [23, 44], "extract": [39, 40, 50], "facilit": 57, "factori": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "fals": [13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 34, 44, 45, 46, 47, 48], "featur": [5, 7, 8, 11, 41, 42, 54], "fidel": 58, "field": [17, 18, 20, 22, 24, 26, 35, 43, 45, 46, 47], "file": [35, 39, 40, 43, 50, 54], "final": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "find": [57, 58], "first": [10, 11, 39, 40, 42, 50, 60], "fit": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "flatten": [36, 37, 49], "flatten_observ": [41, 43], "flattenobservationwrapp": [36, 37, 43, 49], "flax": [19, 21, 25, 45, 46, 47], "float": [5, 6, 23, 35, 41, 43, 44, 47], "float32": [35, 43], "focu": 51, "focus": 52, "follow": [19, 21, 25, 27, 28, 33, 45, 46, 47, 48, 53, 60], "found": [52, 54, 57], "framework": [27, 33, 48, 54, 57], "free": 57, "from": [9, 35, 42, 43, 52, 58, 60], "from_tupl": [43, 44], "frozendict": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "full": [35, 43], "fulli": [27, 28, 48], "function": [6, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 30, 35, 36, 37, 40, 42, 43, 44, 45, 46, 47, 48, 49, 58], "g": 53, "gener": [13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49, 51, 54], "get_checkpoint_factori": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_default_hpo_config": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], 
"get_default_nas_config": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_hpo_config_spac": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_hpo_search_spac": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_nas_config_spac": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "get_spec": [10, 41, 42], "get_state_spac": [11, 41, 42], "git": 60, "github": [21, 25, 35, 43, 46, 47, 60], "give": [19, 21, 25, 45, 46, 47], "given": [5, 6, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 35, 36, 37, 41, 43, 44, 45, 46, 47, 48, 49, 54, 58], "global_step": [17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "good": 52, "gpu": [23, 44], "grad": [11, 13, 17, 18, 20, 22, 42, 44, 45, 46], "grad_info": 42, "gradient": [11, 42, 58], "gradinfo": [11, 41, 42], "gymnasium": [5, 7, 8, 27, 28, 31, 33, 39, 40, 41, 42, 48, 50, 57], "gymnasium_env": [41, 43], "gymnasium_space_to_gymnax_spac": [39, 40, 41, 50], "gymnasiumenv": [27, 31, 43, 48], "gymnax": [27, 28, 29, 30, 31, 32, 33, 34, 39, 40, 48, 50, 54], "gymnax_env": [41, 43], "gymnax_spac": [39, 40, 50], "gymnaxenv": [27, 32, 43, 48], "gynasium": [5, 7, 8, 41, 42], "gynmasium": [5, 7, 8, 41, 42], "ha": [27, 33, 48], "happen": [19, 21, 25, 45, 46, 47, 54], "have": [35, 43, 57], "here": [19, 21, 25, 45, 46, 47], "hidden_s": [19, 21, 25, 44, 45, 46, 47], "hierarchi": [35, 43], "high": 54, "how": [2, 51, 52], "howev": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 52, 57], "hp_config": [9, 39, 40, 42, 50, 54], "hp_config_spac": [39, 40, 50], "hpo": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 52, 58], "hpo_config": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 61], "html": [35, 43], "http": [21, 25, 35, 43, 46, 47], "huggingfac": 51, "hyperparamet": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 41, 42, 44, 45, 46, 47, 50, 51, 52, 54, 58], "i": [3, 5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 41, 42, 44, 45, 46, 47, 51, 52, 54, 55, 57, 60], "id": [9, 27, 28, 
33, 42, 48], "ideal": 57, "identifi": [9, 42], "imit": [10, 11, 42], "immedi": [19, 21, 25, 45, 46, 47], "impact": [35, 43], "implement": [10, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 42, 44, 45, 46, 47, 48], "import": [52, 55], "improv": [35, 43, 58], "includ": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "independ": [23, 44], "inexact": [35, 43], "info": [18, 22, 26, 44, 45, 46, 47], "inform": [5, 7, 8, 11, 41, 42, 51, 54], "infot": [5, 7, 8, 41, 42], "init": [13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 43, 44, 45, 46, 47], "init_and_output": [19, 21, 25, 45, 46, 47], "init_st": [35, 41, 43], "initi": [5, 7, 8, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 35, 41, 42, 43, 44, 45, 46, 47], "insid": [19, 21, 25, 45, 46, 47], "insight": 0, "instanc": [10, 11, 19, 21, 25, 42, 45, 46, 47], "instead": 60, "int": [5, 7, 8, 9, 13, 14, 15, 17, 18, 20, 22, 23, 24, 26, 27, 28, 33, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50], "int32": [35, 43], "integ": [35, 43], "interact": [16, 44], "intern": [0, 27, 28, 36, 37, 48, 49], "interv": [15, 44, 54], "invok": [19, 21, 25, 45, 46, 47], "io": [35, 43], "ipsum": 59, "is_weight": [13, 17, 18, 24, 26, 44, 45, 47], "item": [16, 23, 43, 44], "iter": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47], "its": [5, 7, 8, 36, 37, 41, 42, 49, 58], "jax": [13, 17, 18, 20, 22, 24, 26, 27, 28, 30, 33, 35, 43, 44, 45, 46, 47, 48], "jax_enable_x64": [35, 43], "jit": [35, 43, 57], "jittabl": [27, 28, 48], "jnp": [13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 35, 36, 37, 43, 44, 45, 46, 47, 48, 49], "json": 42, "just": 60, "keep": [10, 11, 42], "kei": [13, 14, 15, 16, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54], "kept": [20, 22, 46], "keyword": [27, 33, 48, 53, 54], "kind": [27, 28, 48], "know": [9, 42], "kwarg": [10, 11, 25, 42, 44, 45, 46, 47], "l48": [21, 25, 46, 47], "landscap": 51, "larg": [35, 43], "last": [9, 10, 42], "last_ob": [16, 43, 44], "latest": [35, 43, 60], "lazi": [19, 21, 25, 
45, 46, 47], "lazili": [19, 21, 25, 45, 46, 47], "learn": [5, 7, 8, 13, 14, 41, 42, 44, 58], "leav": [35, 43], "length": [15, 23, 44], "less": [10, 42], "level": [5, 41, 54, 55, 58], "like": [5, 7, 8, 16, 19, 21, 25, 41, 42, 44, 45, 46, 47, 53, 60], "line": [19, 21, 25, 45, 46, 47], "linen": [19, 21, 25, 45, 46, 47], "linux": 60, "list": [5, 6, 7, 8, 41, 42, 53, 54], "load": [9, 41, 42], "load_buff": [9, 41, 42], "log_prob": [22, 44, 46], "log_std_max": [25, 44, 47], "log_std_min": [25, 44, 47], "logger": [5, 6, 41], "lorem": 59, "loss": [13, 17, 18, 20, 22, 44, 45, 46], "low": 54, "lower": 54, "machin": 58, "make": [23, 44, 60], "make_env": [27, 41, 43], "make_prioritised_item_buff": [23, 43, 44], "mani": 57, "map": [16, 44], "master": [21, 25, 35, 43, 46, 47], "match": [27, 33, 35, 43, 48], "max_abs_valu": [35, 43], "max_length": [23, 44], "max_recorded_prior": 42, "maxim": [10, 42, 54], "maximum": [23, 35, 43, 44, 58], "mean": [10, 35, 41, 42, 43, 53], "mean_std": [35, 43], "measur": [10, 42], "method": [9, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 42, 44, 45, 46, 47, 48, 53, 58], "metric": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "min_length": [23, 44], "minim": [10, 42, 54], "minimum": [23, 35, 43, 44, 58], "mlp": [19, 21, 25, 45, 46, 47], "mlpactorcrit": [21, 44, 46], "mlpq": [19, 44, 45], "mode": [25, 44, 47], "model": [43, 44, 58], "modifi": [35, 43], "modul": [5, 7, 12, 13, 17, 19, 20, 21, 24, 25, 27, 36, 39, 61], "moment": 53, "more": [23, 44, 51, 52, 54], "most": 52, "mrp_file": [41, 42], "multi": 58, "multipl": 58, "must": [27, 33, 35, 43, 48], "mymodul": [19, 21, 25, 45, 46, 47], "n": 60, "n_critic": [25, 44, 47], "n_env": [13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 29, 30, 32, 33, 34, 43, 44, 45, 46, 47, 48, 54], "n_eval_episod": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 54], "n_eval_step": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 54], "n_step": 54, "n_total_timestep": [5, 7, 8, 13, 14, 17, 
18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 54], "name": [9, 19, 21, 25, 27, 28, 33, 35, 39, 40, 42, 43, 44, 45, 46, 47, 48, 50, 54], "namedtupl": [17, 18, 20, 22, 24, 26, 45, 46, 47], "nas_config": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 54], "nas_config_sapc": [39, 40, 50], "naturecnn": [21, 25, 46, 47], "ndarrai": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 35, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49], "need": [27, 28, 48], "nest": [35, 43], "nestedmeanstd": [35, 41, 43], "network": [13, 17, 18, 19, 20, 21, 22, 24, 25, 26, 44, 45, 46, 47, 58], "network_param": [13, 17, 18, 20, 22, 44, 45, 46], "network_st": [44, 47], "neural": [13, 14, 17, 18, 20, 22, 24, 26, 39, 40, 44, 45, 46, 47, 50, 58], "new": [10, 11, 18, 22, 26, 35, 42, 43, 45, 46, 47], "next": [13, 17, 18, 44, 45], "next_observ": [13, 17, 18, 44, 45], "nn": [19, 21, 25, 45, 46, 47], "node": 42, "nodes_fil": [41, 42], "none": [5, 6, 7, 8, 9, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50], "norm": [11, 42], "normal": [35, 41, 43], "normalizer_st": [17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "note": [20, 22, 27, 28, 35, 43, 46, 48], "notebook": [35, 43], "now": [19, 21, 25, 45, 46, 47], "np": [5, 7, 8, 41, 42], "npy": 42, "num_eval_episod": [5, 7, 8, 13, 14, 41, 42, 44], "number": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 33, 36, 37, 41, 42, 44, 45, 46, 47, 48, 49, 53, 54], "numpi": [30, 35, 43, 48], "numpy_to_jax": [30, 43, 48], "ob": [13, 14, 16, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "object": [0, 5, 6, 7, 8, 9, 11, 16, 18, 19, 21, 22, 25, 26, 35, 36, 38, 39, 40, 41, 43, 44, 45, 46, 47, 49, 50, 52, 54, 58, 61], "objectivest": [5, 7, 8, 41, 42], "objectv": [10, 42], "obser": [36, 37, 49], "observ": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 44, 45, 46, 47, 48, 49], "observation_spac": [5, 7, 8, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 43, 48, 49, 61], 
"observationt": [5, 7, 8, 41, 42], "off": 58, "onc": [19, 21, 25, 45, 46, 47], "one": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 33, 41, 42, 44, 45, 46, 47, 48, 52, 54, 60], "ones": 57, "onli": [20, 22, 35, 43, 46], "oper": [23, 44], "opt_stat": [13, 17, 18, 20, 22, 26, 44, 45, 46, 47], "optax": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "optim": [10, 13, 17, 18, 20, 22, 23, 24, 26, 42, 44, 45, 46, 47, 52, 54, 58], "optimize_object": [10, 42, 54], "option": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50], "optstat": [13, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "org": [35, 43], "other": [1, 10, 13, 17, 18, 19, 20, 21, 22, 24, 25, 26, 42, 44, 45, 46, 47], "our": 51, "overflow": [35, 43], "overrid": [10, 11, 42], "overriden": [9, 42], "overview": 54, "own": [52, 57], "packag": [5, 60, 61], "page": 3, "paper": [23, 44, 51, 57], "parallel": 54, "param": [13, 17, 18, 20, 22, 26, 44, 45, 46, 47], "paramet": [5, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 20, 22, 23, 24, 26, 27, 28, 33, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "parent": [19, 21, 25, 44, 45, 46, 47], "part": [9, 42], "pass": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 33, 35, 41, 42, 43, 44, 45, 46, 47, 48], "path": [5, 7, 8, 9, 41, 42], "per": [5, 7, 8, 13, 14, 17, 18, 20, 22, 23, 24, 26, 41, 42, 44, 45, 46, 47], "perform": [5, 7, 8, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 28, 35, 41, 42, 43, 44, 45, 46, 47, 48], "period": [15, 44], "pip": 60, "place": 54, "pleas": [51, 52, 54], "pmap": [35, 43], "pmap_axis_nam": [35, 43], "png": [35, 43], "point": [35, 43], "polici": [13, 20, 22, 44, 46, 54, 58], "possibl": [13, 14, 44], "possibli": [35, 43], "posssibl": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "ppo": [13, 24, 25, 26, 41, 42, 43, 44, 47, 51, 52, 54, 58], "ppometr": [20, 22, 44, 46], "pporunnerst": [13, 20, 22, 44, 46], "ppostat": [13, 20, 22, 44, 46], "ppotrainingresult": [13, 20, 22, 44, 46], "ppotrainreturnt": [13, 20, 
22, 44, 46], "ppotrainst": [20, 22, 44, 46], "pre": 52, "precis": [35, 43], "predefin": 58, "predict": [13, 14, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47], "principl": 58, "prioriti": [9, 23, 42, 44], "prioritis": [23, 44], "prioritised_item_buff": [41, 43], "prioritisedtrajectorybuff": [23, 44], "prioritisedtrajectorybufferst": [9, 13, 15, 17, 18, 24, 26, 42, 44, 45, 47], "priority_expon": [23, 44], "priority_state_path": [9, 42], "prioriz": [15, 44], "prngkei": [13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49], "problem": 58, "proce": 57, "process": [53, 58], "promin": 52, "properti": [5, 7, 8, 13, 14, 27, 28, 29, 30, 31, 32, 34, 36, 37, 41, 42, 44, 48, 49], "propos": 52, "provid": [0, 16, 44, 52, 57], "proxim": [13, 20, 22, 44, 46, 58], "py": [21, 25, 35, 43, 46, 47, 53], "pypi": 60, "python": [53, 60], "q": [13, 17, 18, 19, 44, 45, 58], "question": 52, "rais": [5, 7, 8, 41, 42], "random": [5, 7, 8, 13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 33, 36, 37, 41, 42, 44, 45, 46, 47, 48, 49, 54, 58], "randomli": 58, "rang": [35, 43], "rank": [10, 41, 42], "re": [5, 7, 8, 41, 42, 57], "readthedoc": [35, 43], "real": 58, "reason": 52, "recommend": 51, "recurs": [39, 40, 50], "recursive_concat": [39, 40, 41, 50], "refer": [51, 54], "reinforc": [5, 7, 8, 13, 14, 41, 42, 44, 58], "relat": [9, 42], "relationship": 1, "replac": [18, 22, 26, 35, 41, 43, 44, 45, 46, 47], "repo": 57, "report": [52, 57], "repositori": 60, "requir": [9, 42], "reset": [5, 7, 8, 27, 28, 36, 37, 41, 42, 43, 48, 49, 61], "restor": [9, 42], "result": [9, 13, 14, 17, 18, 20, 22, 24, 26, 35, 36, 37, 42, 43, 44, 45, 46, 47, 49, 51, 52, 54, 57], "return": [5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 54], "return_buff": [20, 22, 44, 46], "return_buffer_idx": [20, 22, 44, 46], "reward": [10, 13, 14, 16, 17, 18, 22, 26, 42, 43, 44, 45, 46, 47, 53], "reward_mean": [42, 
53, 54], "reward_std": [42, 53, 54], "rewardmean": [10, 41, 42], "rewardstd": [10, 41, 42], "rl": [5, 7, 8, 27, 28, 29, 30, 31, 32, 33, 34, 41, 42, 48, 51, 52, 54, 55], "rm": [21, 25, 46, 47], "rng": [13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 44, 45, 46, 47, 48, 49], "rng_kei": [15, 44], "run": [5, 6, 7, 8, 35, 41, 42, 43, 52, 54, 60], "run_arlbench": [5, 6, 41, 61], "runner": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "runner_st": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "running_statist": [41, 61], "runningstatisticsst": [17, 18, 20, 22, 24, 26, 35, 41, 43, 45, 46, 47], "runtim": [10, 41, 42, 53, 54], "sac": [13, 41, 42, 43, 44, 51, 52, 54, 58], "saccnnactor": [25, 44, 47], "saccnncrit": [25, 44, 47], "sacmetr": [24, 26, 44, 47], "sacmlpactor": [25, 44, 47], "sacmlpcrit": [25, 44, 47], "sacrunnerst": [13, 24, 26, 44, 47], "sacstat": [13, 24, 26, 44, 47], "sactrainingresult": [13, 24, 26, 44, 47], "sactrainreturnt": [13, 24, 26, 44, 47], "sactrainst": [13, 24, 26, 44, 47], "sacvectorcrit": [25, 44, 47], "safe": [19, 21, 25, 45, 46, 47], "same": [35, 39, 40, 43, 50], "sampl": [13, 14, 15, 17, 18, 20, 22, 23, 24, 26, 27, 28, 44, 45, 46, 47, 48, 58], "sample_act": [27, 28, 43, 48], "sample_batch_s": [23, 44], "save": [9, 41, 42, 54], "save_buff": [9, 41, 42], "save_defaults_to_yaml": [39, 40, 41, 50], "scalar": 42, "scalars_fil": [41, 42], "schedul": 54, "scope": [44, 45, 46, 47], "search": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47, 52, 54, 57, 58], "second": [39, 40, 50, 60], "section": 52, "see": [19, 21, 25, 35, 43, 45, 46, 47], "seed": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 30, 31, 33, 39, 40, 41, 42, 44, 45, 46, 47, 48, 50, 52, 54], "select": [51, 52, 53], "self": [10, 11, 19, 21, 25, 42, 45, 46, 47], "sequenc": [15, 23, 44], "sequence_length": [15, 44], "set": [16, 35, 43, 44, 54], "setup": [19, 21, 25, 44, 45, 46, 47], "sever": 52, "shape": [13, 14, 35, 43, 44], "share": [13, 14, 44], "should": [35, 43, 54, 57], 
"similar": [19, 21, 25, 45, 46, 47], "simplest": [52, 60], "simplifi": [35, 43], "sinc": 52, "singl": [9, 23, 42, 44], "size": [9, 13, 14, 15, 23, 42, 44], "so": 57, "soft": [13, 24, 26, 44, 47, 58], "sort": [10, 42], "sourc": [5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "space": [5, 7, 8, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50, 51, 52, 54, 57, 58], "specif": [10, 11, 42], "specifi": [18, 22, 26, 35, 43, 45, 46, 47], "stabil": 58, "stabl": [21, 25, 35, 43, 46, 47], "stable_baselines3": [21, 25, 46, 47], "standard": [10, 35, 42, 43, 53], "state": [5, 7, 8, 9, 11, 13, 14, 15, 17, 18, 20, 22, 24, 26, 27, 28, 35, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 54, 57], "state_featur": [41, 54, 61], "statefeatur": [11, 41, 42], "static": [9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 42, 44, 45, 46, 47, 54], "statist": [35, 43], "std": [35, 41, 43], "std_max_valu": [35, 43], "std_min_valu": [35, 43], "step": [5, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 41, 42, 43, 44, 45, 46, 47, 48, 49, 54, 61], "store": [9, 10, 11, 42], "str": [5, 7, 8, 9, 10, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 28, 33, 35, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 50], "string": [39, 40, 50], "strongli": 51, "structur": [35, 43, 52], "sub": [27, 28, 48], "submodul": [19, 21, 25, 61], "subpackag": 61, "subpag": 52, "subsequ": [10, 11, 42], "subset": 52, "summed_vari": [35, 41, 43], "support": [15, 27, 28, 44, 48, 52, 54], "surrog": 58, "system": 60, "t": [35, 43], "tag": [9, 42], "take": [27, 28, 36, 37, 48, 49, 54], "taken": [35, 43], "tanh": [19, 21, 25, 45, 46, 47], "tanhtransformeddistribut": [25, 44, 47], "target": [0, 13, 17, 18, 24, 26, 44, 45, 47, 52], "target_param": [13, 17, 18, 26, 44, 45, 47], "td_error": [13, 17, 18, 24, 26, 44, 45, 47], "termin": [5, 7, 8, 41, 42], "test": 
[52, 54], "than": [10, 42, 57], "thi": [3, 5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 19, 20, 21, 22, 24, 25, 26, 35, 41, 42, 43, 44, 45, 46, 47, 52, 53, 54, 57, 58, 60], "three": [19, 21, 25, 45, 46, 47, 52], "time": [23, 44], "timestep": [13, 14, 16, 17, 18, 20, 22, 24, 26, 43, 44, 45, 46, 47, 54], "to_tupl": [43, 44], "todo": 1, "tool": 54, "top": [5, 41], "torch_lay": [21, 25, 46, 47], "total": [5, 7, 8, 10, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 44, 45, 46, 47, 51, 54], "tpu": [23, 44], "track_metr": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "track_trajectori": [13, 14, 17, 18, 20, 22, 24, 26, 44, 45, 46, 47], "train": [5, 7, 8, 9, 10, 11, 13, 14, 17, 18, 20, 22, 24, 26, 41, 42, 43, 44, 45, 46, 47, 53, 54], "train_func": [10, 11, 42], "train_result": [9, 13, 14, 17, 18, 20, 22, 24, 26, 42, 44, 45, 46, 47], "train_stat": [13, 17, 18, 20, 22, 44, 45, 46], "trainfunc": [10, 11, 42], "training_result": [13, 14, 44], "trainingi": [13, 24, 26, 44, 47], "trainresult": [9, 42], "trainstat": [18, 22, 26, 45, 46, 47], "trajectori": [13, 15, 17, 18, 20, 22, 23, 24, 26, 44, 45, 46, 47], "trajectorybufferst": [9, 42], "transform": [25, 47], "transit": [13, 17, 18, 20, 22, 23, 24, 26, 44, 45, 46, 47], "transitionsampl": [15, 44], "true": [13, 14, 17, 18, 19, 20, 21, 22, 24, 26, 35, 43, 44, 45, 46, 47], "truncat": [5, 7, 8, 41, 42], "tupl": [5, 6, 7, 8, 9, 13, 14, 17, 18, 20, 22, 24, 26, 27, 28, 36, 37, 39, 40, 41, 42, 44, 45, 46, 47, 48, 49, 50], "tuple1": [39, 40, 50], "tuple2": [39, 40, 50], "tuple_concat": [39, 40, 41, 50], "twice": [35, 43], "two": [10, 39, 40, 42, 50, 54, 60], "tx": [18, 22, 26, 45, 46, 47], "type": [5, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "u": [10, 11, 42], "under": 3, "uniform": [15, 44], "uniform_sampl": [15, 43, 44], "union": [20, 22, 24, 26, 44, 45, 46, 47, 48], "uniqu": [9, 42], "unus": [13, 20, 22, 24, 26, 44, 46, 47], 
"updat": [13, 14, 17, 18, 20, 22, 24, 26, 35, 41, 43, 44, 45, 46, 47], "update_actor": [13, 24, 26, 43, 44, 47], "update_alpha": [13, 24, 26, 43, 44, 47], "update_crit": [13, 24, 26, 43, 44, 47], "update_hpo_config": [13, 14, 43, 44], "upper": 54, "us": [5, 6, 7, 8, 10, 13, 14, 17, 18, 20, 22, 23, 24, 26, 27, 33, 35, 41, 42, 43, 44, 45, 46, 47, 48, 51, 52, 53, 54, 57, 58, 60], "usecas": 52, "util": [35, 41, 43, 61], "valid": [35, 43], "validate_shap": [35, 43], "valu": [13, 16, 18, 22, 24, 26, 35, 39, 40, 43, 44, 45, 46, 47, 50], "valueerror": [5, 7, 8, 41, 42], "varianc": [35, 43], "varieti": 52, "variou": [27, 28, 48], "vault": [9, 42], "vault_uuid": [9, 42], "version": 60, "via": 54, "view": [16, 44], "virtual": 60, "wa": [5, 7, 8, 9, 35, 41, 42, 43, 51], "wai": 60, "want": [52, 60], "we": [10, 11, 42, 51, 52, 54, 57], "weigh": 58, "weight": [13, 24, 26, 35, 43, 44, 47], "well": [9, 27, 28, 42, 48, 51, 55], "when": [19, 21, 25, 35, 43, 45, 46, 47, 57], "where": [9, 42, 57], "whether": [9, 10, 13, 14, 23, 24, 26, 42, 44, 47, 54], "which": [9, 19, 21, 25, 42, 45, 46, 47, 51, 52, 57], "while": [10, 11, 42, 54, 60], "wise": [39, 40, 50], "work": [19, 21, 25, 45, 46, 47, 57], "workflow": 52, "world": 58, "would": [57, 60], "wrap": [10, 11, 19, 21, 25, 36, 37, 42, 45, 46, 47, 49, 57], "wrapper": [27, 33, 41, 43, 48], "write": [39, 40, 50], "x": [19, 21, 25, 30, 45, 46, 47, 48], "xland": [27, 33, 34, 48, 54], "xland_env": [41, 43], "xlandenv": [34, 43, 48], "yaml": [39, 40, 50], "ye": 57, "yet": [19, 21, 25, 45, 46, 47], "you": [51, 52, 53, 57, 60], "your": [51, 52, 53, 57]}, "titles": ["Using the ARLBench States", "ARLBench and Different AutoRL Paradigms", "Dynamic Configuration in ARLBench", "Advanced Configuration Options", "API References", "arlbench", "arlbench.arlbench", "arlbench.autorl", "arlbench.autorl.autorl_env", "arlbench.autorl.checkpointing", "arlbench.autorl.objectives", "arlbench.autorl.state_features", "arlbench.core", "arlbench.core.algorithms", 
"arlbench.core.algorithms.algorithm", "arlbench.core.algorithms.buffers", "arlbench.core.algorithms.common", "arlbench.core.algorithms.dqn", "arlbench.core.algorithms.dqn.dqn", "arlbench.core.algorithms.dqn.models", "arlbench.core.algorithms.ppo", "arlbench.core.algorithms.ppo.models", "arlbench.core.algorithms.ppo.ppo", "arlbench.core.algorithms.prioritised_item_buffer", "arlbench.core.algorithms.sac", "arlbench.core.algorithms.sac.models", "arlbench.core.algorithms.sac.sac", "arlbench.core.environments", "arlbench.core.environments.autorl_env", "arlbench.core.environments.brax_env", "arlbench.core.environments.envpool_env", "arlbench.core.environments.gymnasium_env", "arlbench.core.environments.gymnax_env", "arlbench.core.environments.make_env", "arlbench.core.environments.xland_env", "arlbench.core.running_statistics", "arlbench.core.wrappers", "arlbench.core.wrappers.flatten_observation", "arlbench.core.wrappers.wrapper", "arlbench.utils", "arlbench.utils.common", "arlbench package", "arlbench.autorl package", "arlbench.core package", "arlbench.core.algorithms package", "arlbench.core.algorithms.dqn package", "arlbench.core.algorithms.ppo package", "arlbench.core.algorithms.sac package", "arlbench.core.environments package", "arlbench.core.wrappers package", "arlbench.utils package", "The ARLBench Subsets", "Benchmarking AutoRL Methods", "Objectives in ARLBench", "ARLBench Options", "Considerations for Seeding", "&lt;no title&gt;", "Frequently Asked Questions", "Glossary", "Home", "Installation", "arlbench"], "titleterms": {"The": 51, "advanc": 3, "algorithm": [13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 44, 45, 46, 47], "api": 4, "arlbench": [0, 1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 53, 54, 61], "ask": 57, "autorl": [1, 7, 8, 9, 10, 11, 42, 52], "autorl_env": [8, 28, 42, 48], "benchmark": 52, 
"brax_env": [29, 48], "buffer": [15, 44], "checkpoint": [9, 42], "common": [16, 40, 44, 50], "configur": [2, 3], "consider": 55, "content": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "core": [12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 43, 44, 45, 46, 47, 48, 49], "differ": 1, "dqn": [17, 18, 19, 45], "dynam": 2, "environ": [27, 28, 29, 30, 31, 32, 33, 34, 48], "envpool_env": [30, 48], "flatten_observ": [37, 49], "frequent": 57, "glossari": 58, "gymnasium_env": [31, 48], "gymnax_env": [32, 48], "home": 59, "instal": 60, "make_env": [33, 48], "method": 52, "model": [19, 21, 25, 45, 46, 47], "modul": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "object": [10, 42, 53], "option": [3, 54], "packag": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "paradigm": 1, "ppo": [20, 21, 22, 46], "prioritised_item_buff": [23, 44], "question": 57, "refer": 4, "running_statist": [35, 43], "sac": [24, 25, 26, 47], "seed": 55, "state": 0, "state_featur": [11, 42], "submodul": [41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "subpackag": [41, 43, 44], "subset": 51, "us": 0, "util": [39, 40, 50], "wrapper": [36, 37, 38, 49], "xland_env": [34, 48]}})
\ No newline at end of file