All modules for which code is available
- mushroom_rl.algorithms.actor_critic.classic_actor_critic.copdac_q
- mushroom_rl.algorithms.actor_critic.classic_actor_critic.stochastic_ac
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.a2c
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.ddpg
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.deep_actor_critic
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.ppo
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.sac
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.td3
- mushroom_rl.algorithms.actor_critic.deep_actor_critic.trpo
- mushroom_rl.algorithms.policy_search.black_box_optimization.constrained_reps
- mushroom_rl.algorithms.policy_search.black_box_optimization.more
- mushroom_rl.algorithms.policy_search.black_box_optimization.pgpe
- mushroom_rl.algorithms.policy_search.black_box_optimization.reps
- mushroom_rl.algorithms.policy_search.black_box_optimization.rwr
- mushroom_rl.algorithms.policy_search.policy_gradient.enac
- mushroom_rl.algorithms.policy_search.policy_gradient.gpomdp
- mushroom_rl.algorithms.policy_search.policy_gradient.reinforce
- mushroom_rl.algorithms.value.batch_td.boosted_fqi
- mushroom_rl.algorithms.value.batch_td.double_fqi
- mushroom_rl.algorithms.value.batch_td.fqi
- mushroom_rl.algorithms.value.batch_td.lspi
- mushroom_rl.algorithms.value.dqn.abstract_dqn
- mushroom_rl.algorithms.value.dqn.averaged_dqn
- mushroom_rl.algorithms.value.dqn.categorical_dqn
- mushroom_rl.algorithms.value.dqn.double_dqn
- mushroom_rl.algorithms.value.dqn.dqn
- mushroom_rl.algorithms.value.dqn.dueling_dqn
- mushroom_rl.algorithms.value.dqn.maxmin_dqn
- mushroom_rl.algorithms.value.dqn.noisy_dqn
- mushroom_rl.algorithms.value.dqn.quantile_dqn
- mushroom_rl.algorithms.value.dqn.rainbow
- mushroom_rl.algorithms.value.td.double_q_learning
- mushroom_rl.algorithms.value.td.expected_sarsa
- mushroom_rl.algorithms.value.td.maxmin_q_learning
- mushroom_rl.algorithms.value.td.q_lambda
- mushroom_rl.algorithms.value.td.q_learning
- mushroom_rl.algorithms.value.td.r_learning
- mushroom_rl.algorithms.value.td.rq_learning
- mushroom_rl.algorithms.value.td.sarsa
- mushroom_rl.algorithms.value.td.sarsa_lambda
- mushroom_rl.algorithms.value.td.sarsa_lambda_continuous
- mushroom_rl.algorithms.value.td.speedy_q_learning
- mushroom_rl.algorithms.value.td.true_online_sarsa_lambda
- mushroom_rl.algorithms.value.td.weighted_q_learning
- mushroom_rl.approximators.parametric.cmac
- mushroom_rl.approximators.parametric.linear
- mushroom_rl.approximators.parametric.torch_approximator
- mushroom_rl.approximators.regressor
- mushroom_rl.core.agent
- mushroom_rl.core.core
- mushroom_rl.core.environment
- mushroom_rl.core.logger.console_logger
- mushroom_rl.core.logger.data_logger
- mushroom_rl.core.logger.logger
- mushroom_rl.core.serialization
- mushroom_rl.distributions.distribution
- mushroom_rl.distributions.gaussian
- mushroom_rl.environments.atari
- mushroom_rl.environments.car_on_hill
- mushroom_rl.environments.cart_pole
- mushroom_rl.environments.dm_control_env
- mushroom_rl.environments.finite_mdp
- mushroom_rl.environments.generators.grid_world
- mushroom_rl.environments.generators.simple_chain
- mushroom_rl.environments.generators.taxi
- mushroom_rl.environments.grid_world
- mushroom_rl.environments.gym_env
- mushroom_rl.environments.habitat_env
- mushroom_rl.environments.igibson_env
- mushroom_rl.environments.inverted_pendulum
- mushroom_rl.environments.lqr
- mushroom_rl.environments.minigrid_env
- mushroom_rl.environments.mujoco
- mushroom_rl.environments.mujoco_envs.air_hockey.base
- mushroom_rl.environments.mujoco_envs.air_hockey.defend
- mushroom_rl.environments.mujoco_envs.air_hockey.double
- mushroom_rl.environments.mujoco_envs.air_hockey.hit
- mushroom_rl.environments.mujoco_envs.air_hockey.prepare
- mushroom_rl.environments.mujoco_envs.air_hockey.repel
- mushroom_rl.environments.mujoco_envs.air_hockey.single
- mushroom_rl.environments.mujoco_envs.ball_in_a_cup
- mushroom_rl.environments.puddle_world
- mushroom_rl.environments.pybullet
- mushroom_rl.environments.pybullet_envs.air_hockey.base
- mushroom_rl.environments.pybullet_envs.air_hockey.defend
- mushroom_rl.environments.pybullet_envs.air_hockey.hit
- mushroom_rl.environments.pybullet_envs.air_hockey.single
- mushroom_rl.environments.segway
- mushroom_rl.environments.ship_steering
- mushroom_rl.features.basis.fourier
- mushroom_rl.features.basis.gaussian_rbf
- mushroom_rl.features.basis.polynomial
- mushroom_rl.features.features
- mushroom_rl.features.tiles.tiles
- mushroom_rl.features.tiles.voronoi
- mushroom_rl.policy.deterministic_policy
- mushroom_rl.policy.gaussian_policy
- mushroom_rl.policy.noise_policy
- mushroom_rl.policy.policy
- mushroom_rl.policy.td_policy
- mushroom_rl.policy.torch_policy
- mushroom_rl.solvers.car_on_hill
- mushroom_rl.solvers.dynamic_programming
- mushroom_rl.solvers.lqr
- mushroom_rl.utils.angles
- mushroom_rl.utils.callbacks.callback
- mushroom_rl.utils.callbacks.collect_dataset
- mushroom_rl.utils.callbacks.collect_max_q
- mushroom_rl.utils.callbacks.collect_parameters
- mushroom_rl.utils.callbacks.collect_q
- mushroom_rl.utils.dataset
- mushroom_rl.utils.eligibility_trace
- mushroom_rl.utils.features
- mushroom_rl.utils.folder
- mushroom_rl.utils.frames
- mushroom_rl.utils.minibatches
- mushroom_rl.utils.numerical_gradient
- mushroom_rl.utils.parameters
- mushroom_rl.utils.replay_memory
- mushroom_rl.utils.spaces
- mushroom_rl.utils.table
- mushroom_rl.utils.torch
- mushroom_rl.utils.value_functions
- mushroom_rl.utils.variance_parameters
- mushroom_rl.utils.viewer