Ariane¶

Environment Creation¶
[1]:

from a2perf.domains import circuit_training
import gymnasium as gym
env = gym.make('CircuitTraining-Ariane-v0')
Action Space | Discrete(16384)
---|---
Observation Space | Dict('current_node': Box(0, 3499, (1,), int32), 'fake_net_heatmap': Box(0.0, 1.0, (16384,), float32), 'is_node_placed': Box(0, 1, (3500,), int32), 'locations_x': Box(0.0, 1.0, (3500,), float32), 'locations_y': Box(0.0, 1.0, (3500,), float32), 'mask': Box(0, 1, (16384,), int32), 'netlist_index': Box(0, 0, (1,), int32))
Reward Range | (0, 1)
Creation | gym.make("CircuitTraining-Ariane-v0")
Description¶
Circuit Training is an open-source framework for generating chip floor plans with distributed deep reinforcement learning. This framework reproduces the methodology published in the Nature 2021 paper:
A graph placement methodology for fast chip design. Azalia Mirhoseini, Anna Goldie, Mustafa Yazgan, Joe Wenjie Jiang, Ebrahim Songhori, Shen Wang, Young-Joon Lee, Eric Johnson, Omkar Pathak, Azade Nazi, Jiwoo Pak, Andy Tong, Kavya Srinivasa, William Hang, Emre Tuncer, Quoc V. Le, James Laudon, Richard Ho, Roger Carpenter & Jeff Dean, 2021. Nature, 594(7862), pp.207-212. [PDF]
At each timestep, the agent must place a single macro onto the chip canvas.
Note: this environment is only supported on Linux-based OSes.
Action Space¶
[2]:

env.action_space

[2]:

Discrete(16384)

Circuit Training represents the chip canvas as a grid. The action space corresponds to the different locations where the next macro can be placed onto the canvas without violating any hard constraints on density or blockages. In the Ariane netlist case, the canvas is of size \(128 \times 128\), resulting in \(16384\) possible actions. At each step, the agent places a macro. Once all macros are placed, a force-directed method is used to place clusters of standard cells.
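The observation's mask (described below) flags which of the 16,384 grid cells are legal for the current macro. A minimal numpy sketch of sampling uniformly among valid cells; `sample_valid_action` is a hypothetical helper, not part of A2Perf, and a toy 16-cell mask stands in for the real \(128 \times 128\) canvas:

```python
import numpy as np

def sample_valid_action(mask: np.ndarray, rng: np.random.Generator) -> int:
    """Sample uniformly among grid cells whose mask entry is 1."""
    valid = np.flatnonzero(mask)  # indices of placeable cells
    if valid.size == 0:
        raise ValueError("no valid placement locations")
    return int(rng.choice(valid))

# Toy mask: only cells 5 and 7 of a 16-cell canvas are placeable.
mask = np.zeros(16, dtype=np.int32)
mask[[5, 7]] = 1
action = sample_valid_action(mask, np.random.default_rng(0))
assert action in (5, 7)
```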
Observation Space¶
[3]:

env.observation_space

[3]:

Dict('current_node': Box(0, 3499, (1,), int32), 'fake_net_heatmap': Box(0.0, 1.0, (16384,), float32), 'is_node_placed': Box(0, 1, (3500,), int32), 'locations_x': Box(0.0, 1.0, (3500,), float32), 'locations_y': Box(0.0, 1.0, (3500,), float32), 'mask': Box(0, 1, (16384,), int32), 'netlist_index': Box(0, 0, (1,), int32))

The observation space encodes information about the partial placement of the circuit. This includes:
- current_node: the current node to be placed, a single integer ranging from 0 to 3499.
- fake_net_heatmap: a fake net heatmap, providing a continuous representation of estimated connectivity with values between 0.0 and 1.0 across 16,384 points.
- is_node_placed: the placement status of nodes, a binary array of size 3500 showing whether each node has been placed (1) or not (0).
- locations_x: node locations along the x-axis, a continuous array of size 3500 with values from 0.0 to 1.0 representing the x-coordinates of the nodes.
- locations_y: node locations along the y-axis, analogous to locations_x but for the y-coordinates.
- mask: a binary array of size 16,384 indicating the validity of each placement location.
- netlist_index: the netlist index. This usually acts as a placeholder and is fixed at 0.
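As a sanity check, an observation can be verified against the shapes and bounds above with plain numpy; `SPEC` and `check_observation` are hypothetical helpers, not part of A2Perf:

```python
import numpy as np

# Expected (shape, low, high) per key, matching the Dict space above.
SPEC = {
    "current_node":     ((1,),     0,   3499),
    "fake_net_heatmap": ((16384,), 0.0, 1.0),
    "is_node_placed":   ((3500,),  0,   1),
    "locations_x":      ((3500,),  0.0, 1.0),
    "locations_y":      ((3500,),  0.0, 1.0),
    "mask":             ((16384,), 0,   1),
    "netlist_index":    ((1,),     0,   0),
}

def check_observation(obs: dict) -> None:
    """Raise if any entry is missing, mis-shaped, or out of bounds."""
    for key, (shape, low, high) in SPEC.items():
        arr = np.asarray(obs[key])
        assert arr.shape == shape, f"{key}: bad shape {arr.shape}"
        assert arr.min() >= low and arr.max() <= high, f"{key}: out of bounds"

# A reset-style observation: nothing placed yet, all actions valid.
obs = {
    "current_node": np.array([0], dtype=np.int32),
    "fake_net_heatmap": np.zeros(16384, dtype=np.float32),
    "is_node_placed": np.zeros(3500, dtype=np.int32),
    "locations_x": np.zeros(3500, dtype=np.float32),
    "locations_y": np.zeros(3500, dtype=np.float32),
    "mask": np.ones(16384, dtype=np.int32),
    "netlist_index": np.array([0], dtype=np.int32),
}
check_observation(obs)  # passes silently
```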
Optional parameters:¶
Parameter | Type | Default | Description
---|---|---|---
netlist_file | str | path to … | Path to the input netlist file. Predefined by using gym.make.
init_placement | str | path to … | Path to the input initial placement file, used to read grid and canvas size. Predefined by using gym.make.
plc_wrapper_main | str |  | Main PLC wrapper.
create_placement_cost_fn | Callable |  | A function that creates the placement cost object, given the netlist and initial placement files.
std_cell_placer_mode | str |  | Options for fast standard cell placement. The fd option uses the force-directed method.
cost_fn | Callable |  | The cost function that, given the plc object, returns the RL cost.
global_seed | int |  | Global seed for initializing environment features, ensuring consistency across actors.
netlist_index | int |  | Netlist index in the model static features.
is_eval | bool |  | If set, saves the final placement in the output directory.
save_best_cost | bool |  | If set, saves the placement if its cost is better than the previously saved placement.
output_plc_file | str |  | The path to save the final placement.
cd_finetune | bool |  | If True, runs coordinate descent to fine-tune macro orientations. Meant for evaluation, not training.
cd_plc_file | str |  | Name of the coordinate descent fine-tuned plc file.
train_step | Optional[tf.Variable] |  | A tf.Variable indicating the training step, only used for saving the snapshot placement.
output_all_features | bool |  | If true, outputs all observation features. Otherwise, only outputs dynamic observations.
node_order | str |  | The sequence order of nodes placed by RL.
save_snapshot | bool |  | If true, saves the snapshot placement.
save_partial_placement | bool |  | If true, evaluation also saves the placement even if RL does not place all nodes when an episode is done.
use_legacy_reset | bool |  | If true, uses the legacy reset method.
use_legacy_step | bool |  | If true, uses the legacy step method.
render_mode | str |  | Specifies the rendering mode.
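These optional parameters can be overridden at creation time, since gym.make forwards extra keyword arguments to the environment constructor. A configuration sketch, where the chosen values are purely illustrative and the parameter names are assumed to match the table above:

```python
import gymnasium as gym
from a2perf.domains import circuit_training  # registers CircuitTraining-Ariane-v0

# Illustrative overrides; any parameter not listed keeps its default.
env = gym.make(
    "CircuitTraining-Ariane-v0",
    global_seed=1,             # reproducible environment features
    output_all_features=True,  # emit static as well as dynamic observations
)
```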
Rewards¶
The reward is evaluated at the end of each episode. The placement cost binary is used to calculate the reward based on proxy wirelength, congestion, and density. An infeasible placement results in a reward of -1.0.
The reward function is defined as:
\[R_{p,g} = -\text{Wirelength}(p, g) - \lambda \cdot \text{Congestion}(p, g) - \gamma \cdot \text{Density}(p, g)\]
Where:
- \(p\) represents the placement
- \(g\) represents the netlist graph
- \(\lambda\) is the congestion weight
- \(\gamma\) is the density weight
Default values in A2Perf:
- The congestion weight \(\lambda\) is set to 0.01
- The density weight \(\gamma\) is set to 0.01
- The maximum density threshold is set to 0.6

These default values are based on the methodology described in Mirhoseini et al. (2021).
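With these defaults, the reward for a feasible placement is just a weighted sum of the three proxy metrics. The real computation lives in the placement cost binary; the `proxy_reward` helper below is hypothetical and only illustrates the arithmetic:

```python
# Hypothetical helper mirroring R(p, g) = -Wirelength - λ·Congestion - γ·Density
def proxy_reward(wirelength: float, congestion: float, density: float,
                 congestion_weight: float = 0.01,
                 density_weight: float = 0.01) -> float:
    return -(wirelength + congestion_weight * congestion + density_weight * density)

# With A2Perf's defaults (λ = γ = 0.01) and illustrative proxy metrics:
r = proxy_reward(wirelength=0.5, congestion=0.8, density=0.6)
assert abs(r - (-0.514)) < 1e-9  # -(0.5 + 0.008 + 0.006)
```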
Termination¶
The episode terminates once all macros have been placed on the canvas, after which the final reward is calculated.
Registered Configurations¶
CircuitTraining-Ariane-v0