mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 19:20:19 +01:00
Docs changes - fixing blogpost links, removing importing all exploration policies (#139)
* updated docs * removing imports for all exploration policies in __init__ + setting the right blog-post link * small cleanups
This commit is contained in:
committed by
Scott Leishman
parent
155b78b995
commit
f12857a8c7
@@ -226,7 +226,7 @@
|
||||
</li>
|
||||
<li><a href="components/agents/policy_optimization/ac.html#rl_coach.agents.actor_critic_agent.ActorCriticAlgorithmParameters">ActorCriticAlgorithmParameters (class in rl_coach.agents.actor_critic_agent)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.AdditiveNoise">AdditiveNoise (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.additive_noise.AdditiveNoise">AdditiveNoise (class in rl_coach.exploration_policies.additive_noise)</a>
|
||||
</li>
|
||||
</ul></td>
|
||||
<td style="width: 33%; vertical-align: top;"><ul>
|
||||
@@ -262,11 +262,11 @@
|
||||
</li>
|
||||
<li><a href="components/agents/imitation/bc.html#rl_coach.agents.bc_agent.BCAlgorithmParameters">BCAlgorithmParameters (class in rl_coach.agents.bc_agent)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.Boltzmann">Boltzmann (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.boltzmann.Boltzmann">Boltzmann (class in rl_coach.exploration_policies.boltzmann)</a>
|
||||
</li>
|
||||
</ul></td>
|
||||
<td style="width: 33%; vertical-align: top;"><ul>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.Bootstrapped">Bootstrapped (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.bootstrapped.Bootstrapped">Bootstrapped (class in rl_coach.exploration_policies.bootstrapped)</a>
|
||||
</li>
|
||||
<li><a href="components/spaces.html#rl_coach.spaces.BoxActionSpace">BoxActionSpace (class in rl_coach.spaces)</a>
|
||||
</li>
|
||||
@@ -288,11 +288,11 @@
|
||||
</ul></li>
|
||||
<li><a href="components/environments/index.html#rl_coach.environments.carla_environment.CarlaEnvironment">CarlaEnvironment (class in rl_coach.environments.carla_environment)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.Categorical">Categorical (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.categorical.Categorical">Categorical (class in rl_coach.exploration_policies.categorical)</a>
|
||||
</li>
|
||||
<li><a href="components/agents/value_optimization/categorical_dqn.html#rl_coach.agents.categorical_dqn_agent.CategoricalDQNAlgorithmParameters">CategoricalDQNAlgorithmParameters (class in rl_coach.agents.categorical_dqn_agent)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ExplorationPolicy.change_phase">change_phase() (rl_coach.exploration_policies.ExplorationPolicy method)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.exploration_policy.ExplorationPolicy.change_phase">change_phase() (rl_coach.exploration_policies.exploration_policy.ExplorationPolicy method)</a>
|
||||
</li>
|
||||
<li><a href="components/agents/index.html#rl_coach.agents.agent.Agent.choose_action">choose_action() (rl_coach.agents.agent.Agent method)</a>
|
||||
|
||||
@@ -328,7 +328,7 @@
|
||||
</li>
|
||||
<li><a href="components/architectures/index.html#rl_coach.architectures.architecture.Architecture.construct">construct() (rl_coach.architectures.architecture.Architecture static method)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ContinuousEntropy">ContinuousEntropy (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.continuous_entropy.ContinuousEntropy">ContinuousEntropy (class in rl_coach.exploration_policies.continuous_entropy)</a>
|
||||
</li>
|
||||
<li><a href="components/environments/index.html#rl_coach.environments.control_suite_environment.ControlSuiteEnvironment">ControlSuiteEnvironment (class in rl_coach.environments.control_suite_environment)</a>
|
||||
</li>
|
||||
@@ -368,7 +368,7 @@
|
||||
<h2 id="E">E</h2>
|
||||
<table style="width: 100%" class="indextable genindextable"><tr>
|
||||
<td style="width: 33%; vertical-align: top;"><ul>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.EGreedy">EGreedy (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.e_greedy.EGreedy">EGreedy (class in rl_coach.exploration_policies.e_greedy)</a>
|
||||
</li>
|
||||
<li><a href="components/agents/index.html#rl_coach.agents.agent.Agent.emulate_act_on_trainer">emulate_act_on_trainer() (rl_coach.agents.agent.Agent method)</a>
|
||||
|
||||
@@ -398,7 +398,7 @@
|
||||
</li>
|
||||
<li><a href="components/memories/index.html#rl_coach.memories.non_episodic.ExperienceReplay">ExperienceReplay (class in rl_coach.memories.non_episodic)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ExplorationPolicy">ExplorationPolicy (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.exploration_policy.ExplorationPolicy">ExplorationPolicy (class in rl_coach.exploration_policies.exploration_policy)</a>
|
||||
</li>
|
||||
</ul></td>
|
||||
</tr></table>
|
||||
@@ -416,7 +416,7 @@
|
||||
<td style="width: 33%; vertical-align: top;"><ul>
|
||||
<li><a href="components/core_types.html#rl_coach.core_types.Batch.game_overs">game_overs() (rl_coach.core_types.Batch method)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ExplorationPolicy.get_action">get_action() (rl_coach.exploration_policies.ExplorationPolicy method)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.exploration_policy.ExplorationPolicy.get_action">get_action() (rl_coach.exploration_policies.exploration_policy.ExplorationPolicy method)</a>
|
||||
</li>
|
||||
<li><a href="components/environments/index.html#rl_coach.environments.environment.Environment.get_action_from_user">get_action_from_user() (rl_coach.environments.environment.Environment method)</a>
|
||||
</li>
|
||||
@@ -466,7 +466,7 @@
|
||||
</li>
|
||||
<li><a href="components/spaces.html#rl_coach.spaces.GoalsSpace.DistanceMetric">GoalsSpace.DistanceMetric (class in rl_coach.spaces)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.Greedy">Greedy (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.greedy.Greedy">Greedy (class in rl_coach.exploration_policies.greedy)</a>
|
||||
</li>
|
||||
<li><a href="components/environments/index.html#rl_coach.environments.gym_environment.GymEnvironment">GymEnvironment (class in rl_coach.environments.gym_environment)</a>
|
||||
</li>
|
||||
@@ -626,7 +626,7 @@
|
||||
<li><a href="test.html#rl_coach.agents.dqn_agent.DQNAgent.observe">(rl_coach.agents.dqn_agent.DQNAgent method)</a>
|
||||
</li>
|
||||
</ul></li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.OUProcess">OUProcess (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ou_process.OUProcess">OUProcess (class in rl_coach.exploration_policies.ou_process)</a>
|
||||
</li>
|
||||
</ul></td>
|
||||
</tr></table>
|
||||
@@ -640,7 +640,7 @@
|
||||
</li>
|
||||
<li><a href="components/architectures/index.html#rl_coach.architectures.network_wrapper.NetworkWrapper.parallel_prediction">parallel_prediction() (rl_coach.architectures.network_wrapper.NetworkWrapper method)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ParameterNoise">ParameterNoise (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.parameter_noise.ParameterNoise">ParameterNoise (class in rl_coach.exploration_policies.parameter_noise)</a>
|
||||
</li>
|
||||
<li><a href="components/agents/index.html#rl_coach.agents.agent.Agent.parent">parent (rl_coach.agents.agent.Agent attribute)</a>
|
||||
|
||||
@@ -714,9 +714,9 @@
|
||||
</ul></li>
|
||||
<li><a href="components/environments/index.html#rl_coach.environments.environment.Environment.render">render() (rl_coach.environments.environment.Environment method)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ExplorationPolicy.requires_action_values">requires_action_values() (rl_coach.exploration_policies.ExplorationPolicy method)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.exploration_policy.ExplorationPolicy.requires_action_values">requires_action_values() (rl_coach.exploration_policies.exploration_policy.ExplorationPolicy method)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ExplorationPolicy.reset">reset() (rl_coach.exploration_policies.ExplorationPolicy method)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.exploration_policy.ExplorationPolicy.reset">reset() (rl_coach.exploration_policies.exploration_policy.ExplorationPolicy method)</a>
|
||||
</li>
|
||||
<li><a href="components/architectures/index.html#rl_coach.architectures.architecture.Architecture.reset_accumulated_gradients">reset_accumulated_gradients() (rl_coach.architectures.architecture.Architecture method)</a>
|
||||
</li>
|
||||
@@ -870,7 +870,7 @@
|
||||
</li>
|
||||
<li><a href="components/memories/index.html#rl_coach.memories.non_episodic.TransitionCollection">TransitionCollection (class in rl_coach.memories.non_episodic)</a>
|
||||
</li>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.TruncatedNormal">TruncatedNormal (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.truncated_normal.TruncatedNormal">TruncatedNormal (class in rl_coach.exploration_policies.truncated_normal)</a>
|
||||
</li>
|
||||
</ul></td>
|
||||
</tr></table>
|
||||
@@ -878,7 +878,7 @@
|
||||
<h2 id="U">U</h2>
|
||||
<table style="width: 100%" class="indextable genindextable"><tr>
|
||||
<td style="width: 33%; vertical-align: top;"><ul>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.UCB">UCB (class in rl_coach.exploration_policies)</a>
|
||||
<li><a href="components/exploration_policies/index.html#rl_coach.exploration_policies.ucb.UCB">UCB (class in rl_coach.exploration_policies.ucb)</a>
|
||||
</li>
|
||||
<li><a href="components/core_types.html#rl_coach.core_types.Episode.update_discounted_rewards">update_discounted_rewards() (rl_coach.core_types.Episode method)</a>
|
||||
</li>
|
||||
|
||||
Reference in New Issue
Block a user