226 lines
11 KiB
HTML
226 lines
11 KiB
HTML
|
<!DOCTYPE html>
|
||
|
<html class="writer-html5" lang="en" >
|
||
|
<head>
|
||
|
<meta charset="utf-8" /><meta name="generator" content="Docutils 0.19: https://docutils.sourceforge.io/" />
|
||
|
|
||
|
<meta name="viewport" content="width=device-width, initial-scale=1.0" />
|
||
|
<title>Classic Control — Fancy Gym 0.2 documentation</title>
|
||
|
<link rel="stylesheet" href="../../_static/pygments.css" type="text/css" />
|
||
|
<link rel="stylesheet" href="../../_static/css/theme.css" type="text/css" />
|
||
|
<link rel="stylesheet" href="../../_static/style.css" type="text/css" />
|
||
|
<link rel="shortcut icon" href="../../_static/icon.svg"/>
|
||
|
<!--[if lt IE 9]>
|
||
|
<script src="../../_static/js/html5shiv.min.js"></script>
|
||
|
<![endif]-->
|
||
|
|
||
|
<script data-url_root="../../" id="documentation_options" src="../../_static/documentation_options.js"></script>
|
||
|
<script src="../../_static/jquery.js"></script>
|
||
|
<script src="../../_static/underscore.js"></script>
|
||
|
<script src="../../_static/_sphinx_javascript_frameworks_compat.js"></script>
|
||
|
<script src="../../_static/doctools.js"></script>
|
||
|
<script src="../../_static/sphinx_highlight.js"></script>
|
||
|
<script src="../../_static/js/theme.js"></script>
|
||
|
<link rel="index" title="Index" href="../../genindex.html" />
|
||
|
<link rel="search" title="Search" href="../../search.html" />
|
||
|
<link rel="next" title="DeepMind Control (DMC)" href="../dmc.html" />
|
||
|
<link rel="prev" title="AirHockey" href="airhockey.html" />
|
||
|
|
||
|
|
||
|
</head>
|
||
|
|
||
|
<body class="wy-body-for-nav">
|
||
|
<div class="wy-grid-for-nav">
|
||
|
<nav data-toggle="wy-nav-shift" class="wy-nav-side">
|
||
|
<div class="wy-side-scroll">
|
||
|
<div class="wy-side-nav-search" >
|
||
|
|
||
|
|
||
|
|
||
|
<a href="../../index.html" class="icon icon-home">
|
||
|
Fancy Gym
|
||
|
<img src="../../_static/icon.svg" class="logo" alt="Logo"/>
|
||
|
</a>
|
||
|
<div class="version">
|
||
|
0.2
|
||
|
</div>
|
||
|
<div role="search">
|
||
|
<form id="rtd-search-form" class="wy-form" action="../../search.html" method="get">
|
||
|
<input type="text" name="q" placeholder="Search docs" aria-label="Search docs" />
|
||
|
<input type="hidden" name="check_keywords" value="yes" />
|
||
|
<input type="hidden" name="area" value="default" />
|
||
|
</form>
|
||
|
</div>
|
||
|
</div><div class="wy-menu wy-menu-vertical" data-spy="affix" role="navigation" aria-label="Navigation menu">
|
||
|
<p class="caption" role="heading"><span class="caption-text">User Guide</span></p>
|
||
|
<ul>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../guide/installation.html">Installation</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../guide/episodic_rl.html">What is Episodic RL?</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../guide/basic_usage.html">Basic Usage</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../guide/upgrading_envs.html">Creating new MP Environments</a></li>
|
||
|
</ul>
|
||
|
<p class="caption" role="heading"><span class="caption-text">Environments</span></p>
|
||
|
<ul class="current">
|
||
|
<li class="toctree-l1 current"><a class="reference internal" href="index.html">Fancy</a><ul class="current">
|
||
|
<li class="toctree-l2"><a class="reference internal" href="mujoco.html">Mujoco</a></li>
|
||
|
<li class="toctree-l2"><a class="reference internal" href="airhockey.html">AirHockey</a></li>
|
||
|
<li class="toctree-l2 current"><a class="current reference internal" href="#">Classic Control</a><ul>
|
||
|
<li class="toctree-l3"><a class="reference internal" href="#step-based-environments">Step-based Environments</a></li>
|
||
|
<li class="toctree-l3"><a class="reference internal" href="#mp-environments">MP Environments</a></li>
|
||
|
</ul>
|
||
|
</li>
|
||
|
</ul>
|
||
|
</li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../dmc.html">DeepMind Control (DMC)</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../meta.html">Metaworld</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../open_ai.html">Gymnasium</a></li>
|
||
|
</ul>
|
||
|
<p class="caption" role="heading"><span class="caption-text">Examples</span></p>
|
||
|
<ul>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/general.html">General Usage Examples</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/dmc.html">DeepMind Control Examples</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/metaworld.html">Metaworld Examples</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/open_ai.html">OpenAI Envs Examples</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/movement_primitives.html">Movement Primitives Examples</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/mp_params_tuning.html">MP Params Tuning Example</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/pd_control_gain_tuning.html">PD Control Gain Tuning Example</a></li>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../examples/replanning_envs.html">Replanning Example</a></li>
|
||
|
</ul>
|
||
|
<p class="caption" role="heading"><span class="caption-text">API</span></p>
|
||
|
<ul>
|
||
|
<li class="toctree-l1"><a class="reference internal" href="../../api.html">API</a></li>
|
||
|
</ul>
|
||
|
|
||
|
</div>
|
||
|
</div>
|
||
|
</nav>
|
||
|
|
||
|
<section data-toggle="wy-nav-shift" class="wy-nav-content-wrap"><nav class="wy-nav-top" aria-label="Mobile navigation menu" >
|
||
|
<i data-toggle="wy-nav-top" class="fa fa-bars"></i>
|
||
|
<a href="../../index.html">Fancy Gym</a>
|
||
|
</nav>
|
||
|
|
||
|
<div class="wy-nav-content">
|
||
|
<div class="rst-content">
|
||
|
<div role="navigation" aria-label="Page navigation">
|
||
|
<ul class="wy-breadcrumbs">
|
||
|
<li><a href="../../index.html" class="icon icon-home" aria-label="Home"></a></li>
|
||
|
<li class="breadcrumb-item"><a href="index.html">Fancy</a></li>
|
||
|
<li class="breadcrumb-item active">Classic Control</li>
|
||
|
<li class="wy-breadcrumbs-aside">
|
||
|
<a href="https://github.com/ALRhub/fancy_gym/blob/release/docs/source/envs/fancy/classic_control.md" class="fa fa-github"> Edit on GitHub</a>
|
||
|
</li>
|
||
|
</ul>
|
||
|
<hr/>
|
||
|
</div>
|
||
|
<div role="main" class="document" itemscope="itemscope" itemtype="http://schema.org/Article">
|
||
|
<div itemprop="articleBody">
|
||
|
|
||
|
<section id="classic-control">
|
||
|
<h1>Classic Control<a class="headerlink" href="#classic-control" title="Permalink to this heading"></a></h1>
|
||
|
<p>Classic Control environments provide a foundational platform for exploring and experimenting with RL algorithms. These environments are designed to be simple, allowing researchers and practitioners to focus on the fundamental principles of control without the complexities of high-dimensional and physics-based simulations.</p>
|
||
|
<section id="step-based-environments">
|
||
|
<h2>Step-based Environments<a class="headerlink" href="#step-based-environments" title="Permalink to this heading"></a></h2>
|
||
|
<table class="docutils align-default">
|
||
|
<thead>
|
||
|
<tr class="row-odd"><th class="head"><p>Name</p></th>
|
||
|
<th class="head"><p>Description</p></th>
|
||
|
<th class="head"><p>Horizon</p></th>
|
||
|
<th class="head"><p>Action Dimension</p></th>
|
||
|
<th class="head"><p>Observation Dimension</p></th>
|
||
|
</tr>
|
||
|
</thead>
|
||
|
<tbody>
|
||
|
<tr class="row-even"><td><p><code class="docutils literal notranslate"><span class="pre">fancy/SimpleReacher-v0</span></code></p></td>
|
||
|
<td><p>Simple reaching task (2 links) without any physics simulation. Provides no reward until 150 time steps have elapsed. This allows the agent to explore the space, but requires precise actions towards the end of the trajectory.</p></td>
|
||
|
<td><p>200</p></td>
|
||
|
<td><p>2</p></td>
|
||
|
<td><p>9</p></td>
|
||
|
</tr>
|
||
|
<tr class="row-odd"><td><p><code class="docutils literal notranslate"><span class="pre">fancy/LongSimpleReacher-v0</span></code></p></td>
|
||
|
<td><p>Simple reaching task (5 links) without any physics simulation. Provides no reward until 150 time steps have elapsed. This allows the agent to explore the space, but requires precise actions towards the end of the trajectory.</p></td>
|
||
|
<td><p>200</p></td>
|
||
|
<td><p>5</p></td>
|
||
|
<td><p>18</p></td>
|
||
|
</tr>
|
||
|
<tr class="row-even"><td><p><code class="docutils literal notranslate"><span class="pre">fancy/ViaPointReacher-v0</span></code></p></td>
|
||
|
<td><p>Simple reaching task leveraging a via point, which supports self-collision detection. Provides a reward only at time steps 100 and 199 for reaching the via point and goal point, respectively.</p></td>
|
||
|
<td><p>200</p></td>
|
||
|
<td><p>5</p></td>
|
||
|
<td><p>18</p></td>
|
||
|
</tr>
|
||
|
<tr class="row-odd"><td><p><code class="docutils literal notranslate"><span class="pre">fancy/HoleReacher-v0</span></code></p></td>
|
||
|
<td><p>5-link reaching task where the end-effector needs to reach into a narrow hole without colliding with itself or walls.</p></td>
|
||
|
<td><p>200</p></td>
|
||
|
<td><p>5</p></td>
|
||
|
<td><p>18</p></td>
|
||
|
</tr>
|
||
|
</tbody>
|
||
|
</table>
|
||
|
</section>
|
||
|
<section id="mp-environments">
|
||
|
<h2>MP Environments<a class="headerlink" href="#mp-environments" title="Permalink to this heading"></a></h2>
|
||
|
<table class="docutils align-default">
|
||
|
<thead>
|
||
|
<tr class="row-odd"><th class="head"><p>Name</p></th>
|
||
|
<th class="head"><p>Description</p></th>
|
||
|
<th class="head"><p>Horizon</p></th>
|
||
|
<th class="head"><p>Action Dimension</p></th>
|
||
|
<th class="head"><p>Context Dimension</p></th>
|
||
|
</tr>
|
||
|
</thead>
|
||
|
<tbody>
|
||
|
<tr class="row-even"><td><p><code class="docutils literal notranslate"><span class="pre">fancy_DMP/ViaPointReacher-v0</span></code></p></td>
|
||
|
<td><p>A DMP provides a trajectory for the <code class="docutils literal notranslate"><span class="pre">fancy/ViaPointReacher-v0</span></code> task.</p></td>
|
||
|
<td><p>200</p></td>
|
||
|
<td><p>25</p></td>
|
||
|
<td><p></p></td>
|
||
|
</tr>
|
||
|
<tr class="row-odd"><td><p><code class="docutils literal notranslate"><span class="pre">fancy_DMP/HoleReacherFixedGoal-v0</span></code></p></td>
|
||
|
<td><p>A DMP provides a trajectory for the <code class="docutils literal notranslate"><span class="pre">fancy/HoleReacher-v0</span></code> task with a fixed goal attractor.</p></td>
|
||
|
<td><p>200</p></td>
|
||
|
<td><p>25</p></td>
|
||
|
<td><p></p></td>
|
||
|
</tr>
|
||
|
<tr class="row-even"><td><p><code class="docutils literal notranslate"><span class="pre">fancy_DMP/HoleReacher-v0</span></code></p></td>
|
||
|
<td><p>A DMP provides a trajectory for the <code class="docutils literal notranslate"><span class="pre">fancy/HoleReacher-v0</span></code> task. The goal attractor needs to be learned.</p></td>
|
||
|
<td><p>200</p></td>
|
||
|
<td><p>30</p></td>
|
||
|
<td><p></p></td>
|
||
|
</tr>
|
||
|
</tbody>
|
||
|
</table>
|
||
|
</section>
|
||
|
</section>
|
||
|
|
||
|
|
||
|
</div>
|
||
|
</div>
|
||
|
<footer><div class="rst-footer-buttons" role="navigation" aria-label="Footer">
|
||
|
<a href="airhockey.html" class="btn btn-neutral float-left" title="AirHockey" accesskey="p" rel="prev"><span class="fa fa-arrow-circle-left" aria-hidden="true"></span> Previous</a>
|
||
|
<a href="../dmc.html" class="btn btn-neutral float-right" title="DeepMind Control (DMC)" accesskey="n" rel="next">Next <span class="fa fa-arrow-circle-right" aria-hidden="true"></span></a>
|
||
|
</div>
|
||
|
|
||
|
<hr/>
|
||
|
|
||
|
<div role="contentinfo">
|
||
|
<p>© Copyright 2020-2024, Fabian Otto, Onur Celik, Dominik Roth, Hongyi Zhou.</p>
|
||
|
</div>
|
||
|
|
||
|
Built with <a href="https://www.sphinx-doc.org/">Sphinx</a> using a
|
||
|
<a href="https://github.com/readthedocs/sphinx_rtd_theme">theme</a>
|
||
|
provided by <a href="https://readthedocs.org">Read the Docs</a>.
|
||
|
|
||
|
|
||
|
</footer>
|
||
|
</div>
|
||
|
</div>
|
||
|
</section>
|
||
|
</div>
|
||
|
<script>
|
||
|
// Registers a callback with jQuery that calls the theme's navigation enable routine.
// NOTE(review): SphinxRtdTheme is presumably defined by _static/js/theme.js, and the
// `true` argument presumably turns on sticky navigation — confirm against the theme source.
jQuery(function () {
|
||
|
SphinxRtdTheme.Navigation.enable(true);
|
||
|
});
|
||
|
</script>
|
||
|
|
||
|
</body>
|
||
|
</html>
|