All modules for which code is available
- gym.core
- mushroom_rl.algorithms.actor_critic.classic_actor_critic.copdac_q
- mushroom_rl.algorithms.actor_critic.classic_actor_critic.stochastic_ac
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.a2c
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.ddpg
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.deep_actor_critic
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.ppo
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.sac
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.td3
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.trpo
- mushroom_rl.algorithms.agent
- mushroom_rl.algorithms.policy_search.black_box_optimization.black_box_optimization
- mushroom_rl.algorithms.policy_search.black_box_optimization.pgpe
- mushroom_rl.algorithms.policy_search.black_box_optimization.reps
- mushroom_rl.algorithms.policy_search.black_box_optimization.rwr
- mushroom_rl.algorithms.policy_search.policy_gradient.enac
- mushroom_rl.algorithms.policy_search.policy_gradient.gpomdp
- mushroom_rl.algorithms.policy_search.policy_gradient.policy_gradient
- mushroom_rl.algorithms.policy_search.policy_gradient.reinforce
- mushroom_rl.algorithms.value.batch_td.batch_td
- mushroom_rl.algorithms.value.batch_td.fqi
- mushroom_rl.algorithms.value.batch_td.lspi
- mushroom_rl.algorithms.value.dqn.categorical_dqn
- mushroom_rl.algorithms.value.dqn.dqn
- mushroom_rl.algorithms.value.td.double_q_learning
- mushroom_rl.algorithms.value.td.expected_sarsa
- mushroom_rl.algorithms.value.td.q_lambda
- mushroom_rl.algorithms.value.td.q_learning
- mushroom_rl.algorithms.value.td.r_learning
- mushroom_rl.algorithms.value.td.rq_learning
- mushroom_rl.algorithms.value.td.sarsa
- mushroom_rl.algorithms.value.td.sarsa_lambda
- mushroom_rl.algorithms.value.td.sarsa_lambda_continuous
- mushroom_rl.algorithms.value.td.speedy_q_learning
- mushroom_rl.algorithms.value.td.td
- mushroom_rl.algorithms.value.td.true_online_sarsa_lambda
- mushroom_rl.algorithms.value.td.weighted_q_learning
- mushroom_rl.approximators._implementations.ensemble
- mushroom_rl.approximators.parametric.linear
- mushroom_rl.approximators.parametric.torch_approximator
- mushroom_rl.approximators.regressor
- mushroom_rl.core.core
- mushroom_rl.core.serialization
- mushroom_rl.distributions.distribution
- mushroom_rl.distributions.gaussian
- mushroom_rl.environments.atari
- mushroom_rl.environments.car_on_hill
- mushroom_rl.environments.cart_pole
- mushroom_rl.environments.dm_control_env
- mushroom_rl.environments.environment
- mushroom_rl.environments.finite_mdp
- mushroom_rl.environments.generators.grid_world
- mushroom_rl.environments.generators.simple_chain
- mushroom_rl.environments.generators.taxi
- mushroom_rl.environments.grid_world
- mushroom_rl.environments.gym_env
- mushroom_rl.environments.inverted_pendulum
- mushroom_rl.environments.lqr
- mushroom_rl.environments.mujoco
- mushroom_rl.environments.puddle_world
- mushroom_rl.environments.segway
- mushroom_rl.environments.ship_steering
- mushroom_rl.features.basis.fourier
- mushroom_rl.features.basis.gaussian_rbf
- mushroom_rl.features.basis.polynomial
- mushroom_rl.features.features
- mushroom_rl.features.tensors.gaussian_tensor
- mushroom_rl.features.tiles.tiles
- mushroom_rl.policy.deterministic_policy
- mushroom_rl.policy.gaussian_policy
- mushroom_rl.policy.noise_policy
- mushroom_rl.policy.policy
- mushroom_rl.policy.td_policy
- mushroom_rl.policy.torch_policy
- mushroom_rl.solvers.car_on_hill
- mushroom_rl.solvers.dynamic_programming
- mushroom_rl.solvers.lqr
- mushroom_rl.utils.angles
- mushroom_rl.utils.callbacks.callback
- mushroom_rl.utils.callbacks.collect_dataset
- mushroom_rl.utils.callbacks.collect_max_q
- mushroom_rl.utils.callbacks.collect_parameters
- mushroom_rl.utils.callbacks.collect_q
- mushroom_rl.utils.dataset
- mushroom_rl.utils.eligibility_trace
- mushroom_rl.utils.features
- mushroom_rl.utils.folder
- mushroom_rl.utils.frames
- mushroom_rl.utils.minibatches
- mushroom_rl.utils.numerical_gradient
- mushroom_rl.utils.parameters
- mushroom_rl.utils.replay_memory
- mushroom_rl.utils.spaces
- mushroom_rl.utils.table
- mushroom_rl.utils.torch
- mushroom_rl.utils.value_functions
- mushroom_rl.utils.variance_parameters
- mushroom_rl.utils.viewer