garage
v2020.06.0
Installation
Running Experiments
Implementing New Environments
Implementing New Algorithms
garage
Docs
»
Index
Edit on GitHub
Index
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
K
|
L
|
M
|
N
|
O
|
P
|
Q
|
R
|
S
|
T
|
U
|
V
|
W
|
Z
A
action (TimeStep attribute)
action_from_direction() (GridWorldEnv static method)
,
[1]
action_space (DmControlEnv attribute)
,
[1]
(EnvSpec attribute)
,
[1]
(GridWorldEnv attribute)
,
[1]
(ParallelVecEnvExecutor attribute)
,
[1]
(PointEnv attribute)
,
[1]
,
[2]
,
[3]
(Policy attribute)
,
[1]
,
[2]
,
[3]
,
[4]
,
[5]
(VecEnvExecutor attribute)
,
[1]
actions (MAMLTrajectoryBatch attribute)
(TimeStepBatch attribute)
(TrajectoryBatch attribute)
active_task_index (MultiEnvWrapper attribute)
,
[1]
adapt_policy() (MAML method)
(MetaRLAlgorithm method)
,
[1]
(PEARL method)
,
[1]
(RL2 method)
,
[1]
add_history() (ISSampler method)
,
[1]
add_path() (HERReplayBuffer method)
,
[1]
(PathBuffer method)
,
[1]
add_transition() (ReplayBuffer method)
,
[1]
add_transitions() (ReplayBuffer method)
,
[1]
AddGaussianNoise (class in garage.np.exploration_policies)
(class in garage.np.exploration_policies.add_gaussian_noise)
AddOrnsteinUhlenbeckNoise (class in garage.np.exploration_policies)
(class in garage.np.exploration_policies.add_ornstein_uhlenbeck_noise)
agent (DefaultWorker attribute)
,
[1]
(PEARLWorker attribute)
(RL2Worker attribute)
(TFWorkerWrapper attribute)
,
[1]
(TaskEmbeddingWorker attribute)
agent_info (TimeStep attribute)
agent_infos (TimeStepBatch attribute)
(TrajectoryBatch attribute)
AtariEnv (class in garage.envs.wrappers)
(class in garage.envs.wrappers.atari_env)
augment_env_spec() (garage.torch.algos.PEARL class method)
(garage.torch.algos.pearl.PEARL class method)
augmented_observation_space (TaskEmbeddingPolicy attribute)
,
[1]
B
Baseline (class in garage.np.baselines)
(class in garage.np.baselines.baseline)
baselines (MAMLTrajectoryBatch attribute)
BaseModel (class in garage.tf.models)
(class in garage.tf.models.model)
BaseSampler (class in garage.sampler.sampler_deprecated)
BatchDataset (class in garage.np.optimizers)
(class in garage.np.optimizers.minibatch_dataset)
BatchSampler (class in garage.sampler)
(class in garage.sampler.batch_sampler)
(class in garage.tf.samplers)
(class in garage.tf.samplers.batch_sampler)
Bernoulli (class in garage.tf.distributions)
(class in garage.tf.distributions.bernoulli)
BernoulliMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.bernoulli_mlp_regressor)
build() (BaseModel method)
,
[1]
(CategoricalCNNPolicy method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPEncoder method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
(GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(Model method)
,
[1]
(StochasticEncoder method)
,
[1]
build_eval() (HessianVectorProduct method)
C
Categorical (class in garage.tf.distributions)
(class in garage.tf.distributions.categorical)
CategoricalCNNModel (class in garage.tf.models)
(class in garage.tf.models.categorical_cnn_model)
CategoricalCNNPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_cnn_policy)
CategoricalGRUModel (class in garage.tf.models)
(class in garage.tf.models.categorical_gru_model)
CategoricalGRUPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_gru_policy)
CategoricalLSTMModel (class in garage.tf.models)
(class in garage.tf.models.categorical_lstm_model)
CategoricalLSTMPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_lstm_policy)
CategoricalMLPModel (class in garage.tf.models)
(class in garage.tf.models.categorical_mlp_model)
CategoricalMLPPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_mlp_policy)
CategoricalMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.categorical_mlp_regressor)
CategoricalMLPRegressorModel (class in garage.tf.regressors.categorical_mlp_regressor_model)
cdf() (TanhNormal method)
,
[1]
CEM (class in garage.np.algos)
(class in garage.np.algos.cem)
center_advs() (in module garage.tf.misc.tensor_utils)
cg() (in module garage.tf.optimizers.conjugate_gradient_optimizer)
child_proc_shutdown() (in module garage.experiment.experiment_wrapper)
clear() (PathBuffer method)
,
[1]
ClipReward (class in garage.envs.wrappers)
(class in garage.envs.wrappers.clip_reward)
clone() (CategoricalCNNPolicy method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(CategoricalMLPRegressorModel method)
(ContinuousCNNQFunction method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(ContinuousMLPQFunction method)
,
[1]
(DiscreteCNNQFunction method)
,
[1]
(DiscreteMLPQFunction method)
,
[1]
(Encoder method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPEncoder method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
(GaussianMLPRegressorModel method)
(GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(QFunction method)
,
[1]
close() (DmControlEnv method)
,
[1]
(DmControlViewer method)
,
[1]
(GarageEnv method)
,
[1]
(MultiEnvWrapper method)
,
[1]
(ParallelVecEnvExecutor method)
,
[1]
(Plotter method)
,
[1]
,
[2]
,
[3]
(StatefulPool method)
(VecEnvExecutor method)
,
[1]
(in module garage.sampler.parallel_sampler)
CMAES (class in garage.np.algos)
(class in garage.np.algos.cma_es)
cnn() (in module garage.tf.models.cnn)
cnn_with_max_pooling() (in module garage.tf.models.cnn)
CNNMLPMergeModel (class in garage.tf.models)
(class in garage.tf.models.cnn_mlp_merge_model)
CNNModel (class in garage.tf.models)
(class in garage.tf.models.cnn_model)
CNNModelWithMaxPooling (class in garage.tf.models)
(class in garage.tf.models.cnn_model_max_pooling)
collect_rollout() (DefaultWorker method)
,
[1]
(TFWorkerWrapper method)
,
[1]
(TaskEmbeddingWorker method)
(VecWorker method)
,
[1]
(Worker method)
,
[1]
compile_function() (in module garage.tf.misc.tensor_utils)
compute_advantages() (in module garage.tf.misc.tensor_utils)
(in module garage.torch)
compute_kl_div() (ContextConditionedPolicy method)
,
[1]
compute_loss() (GaussianMLPValueFunction method)
,
[1]
(ValueFunction method)
,
[1]
concat_tensor_dict_list() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
concat_tensor_list() (in module garage.tf.misc.tensor_utils)
concatenate() (garage.TimeStepBatch class method)
(garage.TrajectoryBatch class method)
ConjugateGradientOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.conjugate_gradient_optimizer)
(class in garage.torch.optimizers)
(class in garage.torch.optimizers.conjugate_gradient_optimizer)
constraint_val() (ConjugateGradientOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
ConstructEnvsSampler (class in garage.experiment.task_sampler)
context (ContextConditionedPolicy attribute)
,
[1]
ContextConditionedPolicy (class in garage.torch.policies)
(class in garage.torch.policies.context_conditioned_policy)
ContinuousCNNQFunction (class in garage.tf.q_functions)
(class in garage.tf.q_functions.continuous_cnn_q_function)
ContinuousMLPBaseline (class in garage.tf.baselines)
(class in garage.tf.baselines.continuous_mlp_baseline)
ContinuousMLPPolicy (class in garage.tf.policies)
(class in garage.tf.policies.continuous_mlp_policy)
ContinuousMLPQFunction (class in garage.tf.q_functions)
(class in garage.tf.q_functions.continuous_mlp_q_function)
(class in garage.torch.q_functions)
(class in garage.torch.q_functions.continuous_mlp_q_function)
ContinuousMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.continuous_mlp_regressor)
cross_entropy_sym() (Categorical method)
,
[1]
D
DDPG (class in garage.tf.algos)
(class in garage.tf.algos.ddpg)
(class in garage.torch.algos)
(class in garage.torch.algos.ddpg)
default() (LogEncoder method)
DEFAULT_N_ENVS (VecWorker attribute)
,
[1]
DefaultWorker (class in garage.sampler)
(class in garage.sampler.default_worker)
DeterministicMLPPolicy (class in garage.torch.policies)
(class in garage.torch.policies.deterministic_mlp_policy)
DiagonalGaussian (class in garage.tf.distributions)
(class in garage.tf.distributions.diagonal_gaussian)
dict_np_to_torch() (in module garage.torch)
DifferentiableSGD (class in garage.torch.optimizers)
(class in garage.torch.optimizers.differentiable_sgd)
dim (Bernoulli attribute)
,
[1]
(Categorical attribute)
,
[1]
(DiagonalGaussian attribute)
,
[1]
(Distribution attribute)
,
[1]
(RecurrentCategorical attribute)
,
[1]
disable() (Plotter static method)
,
[1]
discount_cumsum() (in module garage.misc.tensor_utils)
discounted_returns() (in module garage.tf.misc.tensor_utils)
DiscreteCNNQFunction (class in garage.tf.q_functions)
(class in garage.tf.q_functions.discrete_cnn_q_function)
DiscreteMLPQFunction (class in garage.tf.q_functions)
(class in garage.tf.q_functions.discrete_mlp_q_function)
DiscreteQfDerivedPolicy (class in garage.tf.policies)
(class in garage.tf.policies.discrete_qf_derived_policy)
dist_info() (StochasticPolicy method)
,
[1]
dist_info_keys (Bernoulli attribute)
,
[1]
(Distribution attribute)
,
[1]
dist_info_specs (Categorical attribute)
,
[1]
(DiagonalGaussian attribute)
,
[1]
(Distribution attribute)
,
[1]
(RecurrentCategorical attribute)
,
[1]
dist_info_sym() (BernoulliMLPRegressor method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
distribution (BernoulliMLPRegressor attribute)
,
[1]
(CategoricalCNNPolicy attribute)
,
[1]
(CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(CategoricalMLPPolicy attribute)
,
[1]
(CategoricalMLPRegressor attribute)
,
[1]
Distribution (class in garage.tf.distributions)
(class in garage.tf.distributions.distribution)
distribution (GaussianCNNRegressor attribute)
,
[1]
(GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(GaussianMLPEncoder attribute)
,
[1]
(GaussianMLPPolicy attribute)
,
[1]
(GaussianMLPRegressor attribute)
,
[1]
(GaussianMLPTaskEmbeddingPolicy attribute)
,
[1]
(StochasticEncoder attribute)
,
[1]
(StochasticModule attribute)
,
[1]
(StochasticPolicy attribute)
,
[1]
DmControlEnv (class in garage.envs.dm_control)
(class in garage.envs.dm_control.dm_control_env)
DmControlViewer (class in garage.envs.dm_control)
(class in garage.envs.dm_control.dm_control_viewer)
DQN (class in garage.tf.algos)
(class in garage.tf.algos.dqn)
dump_json() (in module garage.experiment.experiment)
E
enable (Plotter attribute)
,
[1]
Encoder (class in garage.np.embeddings)
(class in garage.np.embeddings.encoder)
(class in garage.tf.embeddings)
(class in garage.tf.embeddings.encoder)
encoder (TaskEmbeddingPolicy attribute)
,
[1]
encoder_distribution (TaskEmbeddingPolicy attribute)
,
[1]
entropy() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
(TanhNormal method)
,
[1]
entropy_sym() (Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
enumerate_support() (TanhNormal method)
,
[1]
env (DefaultWorker attribute)
,
[1]
(PEARLWorker attribute)
(RL2Worker attribute)
(TFWorkerWrapper attribute)
,
[1]
(TaskEmbeddingWorker attribute)
env_info (TimeStep attribute)
env_infos (TimeStepBatch attribute)
(TrajectoryBatch attribute)
env_spec (Policy attribute)
,
[1]
(TimeStep attribute)
(TimeStepBatch attribute)
(TrajectoryBatch attribute)
EnvPoolSampler (class in garage.experiment.task_sampler)
EnvSpec (class in garage.envs)
(class in garage.envs.env_spec)
EnvUpdate (class in garage.sampler.env_update)
EpisodicLife (class in garage.envs.wrappers)
(class in garage.envs.wrappers.episodic_life)
EpsilonGreedyPolicy (class in garage.np.exploration_policies)
(class in garage.np.exploration_policies.epsilon_greedy_policy)
ERWR (class in garage.tf.algos)
(class in garage.tf.algos.erwr)
evaluate() (MetaEvaluator method)
,
[1]
(TENPO method)
,
[1]
ExistingEnvUpdate (class in garage.sampler.env_update)
expand() (TanhNormal method)
,
[1]
ExperimentContext (class in garage.experiment.experiment)
ExperimentStats (class in garage.experiment.local_runner)
ExperimentTemplate (class in garage.experiment.experiment)
explained_variance_1d() (in module garage.misc.tensor_utils)
ExplorationPolicy (class in garage.np.exploration_policies)
(class in garage.np.exploration_policies.exploration_policy)
F
filter_valids() (in module garage.tf.misc.tensor_utils)
(in module garage.torch)
filter_valids_dict() (in module garage.tf.misc.tensor_utils)
FiniteDifferenceHvp (class in garage.tf.optimizers)
(class in garage.tf.optimizers.conjugate_gradient_optimizer)
FireReset (class in garage.envs.wrappers)
(class in garage.envs.wrappers.fire_reset)
FirstOrderOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.first_order_optimizer)
fit() (Baseline method)
,
[1]
(BernoulliMLPRegressor method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(ContinuousMLPRegressor method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(GaussianMLPRegressor method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(Regressor method)
,
[1]
(ZeroBaseline method)
,
[1]
FixedPolicy (class in garage.np.policies)
(class in garage.np.policies.fixed_policy)
flat_to_params() (Module method)
,
[1]
flatten_batch() (in module garage.tf.misc.tensor_utils)
(in module garage.torch)
flatten_batch_dict() (in module garage.tf.misc.tensor_utils)
flatten_inputs() (in module garage.tf.misc.tensor_utils)
flatten_tensor_variables() (in module garage.tf.misc.tensor_utils)
flatten_tensors() (in module garage.misc.tensor_utils)
forward() (ContextConditionedPolicy method)
,
[1]
(ContinuousMLPQFunction method)
,
[1]
(DeterministicMLPPolicy method)
,
[1]
(GaussianMLPBaseModule method)
(GaussianMLPPolicy method)
,
[1]
(GaussianMLPValueFunction method)
,
[1]
(MLPModule method)
,
[1]
(MultiHeadedMLPModule method)
,
[1]
(StochasticPolicy method)
(TanhGaussianMLPPolicy method)
,
[1]
from_onehot() (in module garage.tf.distributions.categorical)
from_suite() (garage.envs.dm_control.dm_control_env.DmControlEnv class method)
(garage.envs.dm_control.DmControlEnv class method)
from_time_step_list() (garage.TimeStepBatch class method)
from_trajectory_list() (garage.TrajectoryBatch class method)
from_worker_factory() (garage.sampler.local_sampler.LocalSampler class method)
(garage.sampler.LocalSampler class method)
(garage.sampler.MultiprocessingSampler class method)
(garage.sampler.RaySampler class method)
(garage.sampler.Sampler class method)
(garage.sampler.multiprocessing_sampler.MultiprocessingSampler class method)
(garage.sampler.ray_sampler.RaySampler class method)
(garage.sampler.sampler.Sampler class method)
full (ReplayBuffer attribute)
,
[1]
G
garage (module)
garage.envs (module)
garage.envs.dm_control (module)
garage.envs.dm_control.dm_control_env (module)
garage.envs.dm_control.dm_control_viewer (module)
garage.envs.env_spec (module)
garage.envs.garage_env (module)
garage.envs.grid_world_env (module)
garage.envs.mujoco (module)
garage.envs.mujoco.half_cheetah_dir_env (module)
garage.envs.mujoco.half_cheetah_env_meta_base (module)
garage.envs.mujoco.half_cheetah_vel_env (module)
garage.envs.multi_env_wrapper (module)
garage.envs.normalized_env (module)
garage.envs.point_env (module)
garage.envs.step (module)
garage.envs.task_onehot_wrapper (module)
garage.envs.wrappers (module)
garage.envs.wrappers.atari_env (module)
garage.envs.wrappers.clip_reward (module)
garage.envs.wrappers.episodic_life (module)
garage.envs.wrappers.fire_reset (module)
garage.envs.wrappers.grayscale (module)
garage.envs.wrappers.max_and_skip (module)
garage.envs.wrappers.noop (module)
garage.envs.wrappers.resize (module)
garage.envs.wrappers.stack_frames (module)
garage.experiment (module)
garage.experiment.deterministic (module)
garage.experiment.experiment (module)
garage.experiment.experiment_wrapper (module)
garage.experiment.local_runner (module)
garage.experiment.local_tf_runner (module)
garage.experiment.meta_evaluator (module)
garage.experiment.snapshotter (module)
garage.experiment.task_sampler (module)
garage.misc (module)
garage.misc.tensor_utils (module)
garage.np (module)
garage.np.algos (module)
garage.np.algos.cem (module)
garage.np.algos.cma_es (module)
garage.np.algos.meta_rl_algorithm (module)
garage.np.algos.nop (module)
garage.np.algos.rl_algorithm (module)
garage.np.baselines (module)
garage.np.baselines.baseline (module)
garage.np.baselines.linear_feature_baseline (module)
garage.np.baselines.linear_multi_feature_baseline (module)
garage.np.baselines.zero_baseline (module)
garage.np.embeddings (module)
garage.np.embeddings.encoder (module)
garage.np.exploration_policies (module)
garage.np.exploration_policies.add_gaussian_noise (module)
garage.np.exploration_policies.add_ornstein_uhlenbeck_noise (module)
garage.np.exploration_policies.epsilon_greedy_policy (module)
garage.np.exploration_policies.exploration_policy (module)
garage.np.optimizers (module)
garage.np.optimizers.minibatch_dataset (module)
garage.np.policies (module)
garage.np.policies.fixed_policy (module)
garage.np.policies.policy (module)
garage.np.policies.scripted_policy (module)
garage.np.q_functions (module)
garage.np.q_functions.q_function (module)
garage.plotter (module)
garage.plotter.plotter (module)
garage.replay_buffer (module)
garage.replay_buffer.her_replay_buffer (module)
garage.replay_buffer.path_buffer (module)
garage.replay_buffer.replay_buffer (module)
garage.sampler (module)
garage.sampler.batch_sampler (module)
garage.sampler.default_worker (module)
garage.sampler.env_update (module)
garage.sampler.is_sampler (module)
garage.sampler.local_sampler (module)
garage.sampler.multiprocessing_sampler (module)
garage.sampler.off_policy_vectorized_sampler (module)
garage.sampler.on_policy_vectorized_sampler (module)
garage.sampler.parallel_sampler (module)
garage.sampler.parallel_vec_env_executor (module)
garage.sampler.ray_sampler (module)
garage.sampler.sampler (module)
garage.sampler.sampler_deprecated (module)
garage.sampler.stateful_pool (module)
garage.sampler.utils (module)
garage.sampler.vec_env_executor (module)
garage.sampler.vec_worker (module)
garage.sampler.worker (module)
garage.sampler.worker_factory (module)
garage.tf (module)
garage.tf.algos (module)
garage.tf.algos.ddpg (module)
garage.tf.algos.dqn (module)
garage.tf.algos.erwr (module)
garage.tf.algos.npo (module)
garage.tf.algos.ppo (module)
garage.tf.algos.reps (module)
garage.tf.algos.rl2 (module)
garage.tf.algos.rl2ppo (module)
garage.tf.algos.rl2trpo (module)
garage.tf.algos.td3 (module)
garage.tf.algos.te (module)
garage.tf.algos.te_npo (module)
garage.tf.algos.te_ppo (module)
garage.tf.algos.tnpg (module)
garage.tf.algos.trpo (module)
garage.tf.algos.vpg (module)
garage.tf.baselines (module)
garage.tf.baselines.continuous_mlp_baseline (module)
garage.tf.baselines.gaussian_cnn_baseline (module)
garage.tf.baselines.gaussian_mlp_baseline (module)
garage.tf.distributions (module)
garage.tf.distributions.bernoulli (module)
garage.tf.distributions.categorical (module)
garage.tf.distributions.diagonal_gaussian (module)
garage.tf.distributions.distribution (module)
garage.tf.distributions.recurrent_categorical (module)
garage.tf.distributions.recurrent_diagonal_gaussian (module)
garage.tf.embeddings (module)
garage.tf.embeddings.encoder (module)
garage.tf.embeddings.gaussian_mlp_encoder (module)
garage.tf.misc (module)
garage.tf.misc.tensor_utils (module)
garage.tf.models (module)
garage.tf.models.categorical_cnn_model (module)
garage.tf.models.categorical_gru_model (module)
garage.tf.models.categorical_lstm_model (module)
garage.tf.models.categorical_mlp_model (module)
garage.tf.models.cnn (module)
garage.tf.models.cnn_mlp_merge_model (module)
garage.tf.models.cnn_model (module)
garage.tf.models.cnn_model_max_pooling (module)
garage.tf.models.gaussian_cnn_model (module)
garage.tf.models.gaussian_gru_model (module)
garage.tf.models.gaussian_lstm_model (module)
garage.tf.models.gaussian_mlp_model (module)
garage.tf.models.gru (module)
garage.tf.models.gru_model (module)
garage.tf.models.lstm (module)
garage.tf.models.lstm_model (module)
garage.tf.models.mlp (module)
garage.tf.models.mlp_dueling_model (module)
garage.tf.models.mlp_merge_model (module)
garage.tf.models.mlp_model (module)
garage.tf.models.model (module)
garage.tf.models.module (module)
garage.tf.models.normalized_input_mlp_model (module)
garage.tf.models.parameter (module)
garage.tf.models.sequential (module)
garage.tf.optimizers (module)
garage.tf.optimizers.conjugate_gradient_optimizer (module)
garage.tf.optimizers.first_order_optimizer (module)
garage.tf.optimizers.lbfgs_optimizer (module)
garage.tf.optimizers.penalty_lbfgs_optimizer (module)
garage.tf.optimizers.utils (module)
garage.tf.plotter (module)
garage.tf.plotter.plotter (module)
garage.tf.policies (module)
garage.tf.policies.categorical_cnn_policy (module)
garage.tf.policies.categorical_gru_policy (module)
garage.tf.policies.categorical_lstm_policy (module)
garage.tf.policies.categorical_mlp_policy (module)
garage.tf.policies.continuous_mlp_policy (module)
garage.tf.policies.discrete_qf_derived_policy (module)
garage.tf.policies.gaussian_gru_policy (module)
garage.tf.policies.gaussian_lstm_policy (module)
garage.tf.policies.gaussian_mlp_policy (module)
garage.tf.policies.gaussian_mlp_task_embedding_policy (module)
garage.tf.policies.policy (module)
garage.tf.policies.task_embedding_policy (module)
garage.tf.policies.uniform_control_policy (module)
garage.tf.q_functions (module)
garage.tf.q_functions.continuous_cnn_q_function (module)
garage.tf.q_functions.continuous_mlp_q_function (module)
garage.tf.q_functions.discrete_cnn_q_function (module)
garage.tf.q_functions.discrete_mlp_q_function (module)
garage.tf.q_functions.q_function (module)
garage.tf.regressors (module)
garage.tf.regressors.bernoulli_mlp_regressor (module)
garage.tf.regressors.categorical_mlp_regressor (module)
garage.tf.regressors.categorical_mlp_regressor_model (module)
garage.tf.regressors.continuous_mlp_regressor (module)
garage.tf.regressors.gaussian_cnn_regressor (module)
garage.tf.regressors.gaussian_cnn_regressor_model (module)
garage.tf.regressors.gaussian_mlp_regressor (module)
garage.tf.regressors.gaussian_mlp_regressor_model (module)
garage.tf.regressors.regressor (module)
garage.tf.samplers (module)
garage.tf.samplers.batch_sampler (module)
garage.tf.samplers.worker (module)
garage.torch (module)
garage.torch.algos (module)
garage.torch.algos.ddpg (module)
garage.torch.algos.maml (module)
garage.torch.algos.maml_ppo (module)
garage.torch.algos.maml_trpo (module)
garage.torch.algos.maml_vpg (module)
garage.torch.algos.mtsac (module)
garage.torch.algos.pearl (module)
garage.torch.algos.ppo (module)
garage.torch.algos.sac (module)
garage.torch.algos.trpo (module)
garage.torch.algos.vpg (module)
garage.torch.distributions (module)
garage.torch.distributions.tanh_normal (module)
garage.torch.embeddings (module)
garage.torch.embeddings.mlp_encoder (module)
garage.torch.modules (module)
garage.torch.modules.gaussian_mlp_module (module)
garage.torch.modules.mlp_module (module)
garage.torch.modules.multi_headed_mlp_module (module)
garage.torch.optimizers (module)
garage.torch.optimizers.conjugate_gradient_optimizer (module)
garage.torch.optimizers.differentiable_sgd (module)
garage.torch.optimizers.optimizer_wrapper (module)
garage.torch.policies (module)
garage.torch.policies.context_conditioned_policy (module)
garage.torch.policies.deterministic_mlp_policy (module)
garage.torch.policies.gaussian_mlp_policy (module)
garage.torch.policies.policy (module)
garage.torch.policies.stochastic_policy (module)
garage.torch.policies.tanh_gaussian_mlp_policy (module)
garage.torch.q_functions (module)
garage.torch.q_functions.continuous_mlp_q_function (module)
garage.torch.value_functions (module)
garage.torch.value_functions.gaussian_mlp_value_function (module)
garage.torch.value_functions.value_function (module)
GarageEnv (class in garage.envs)
(class in garage.envs.garage_env)
GaussianCNNBaseline (class in garage.tf.baselines)
(class in garage.tf.baselines.gaussian_cnn_baseline)
GaussianCNNModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_cnn_model)
GaussianCNNRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.gaussian_cnn_regressor)
GaussianCNNRegressorModel (class in garage.tf.regressors)
(class in garage.tf.regressors.gaussian_cnn_regressor_model)
GaussianGRUModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_gru_model)
GaussianGRUPolicy (class in garage.tf.policies)
(class in garage.tf.policies.gaussian_gru_policy)
GaussianLSTMModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_lstm_model)
GaussianLSTMPolicy (class in garage.tf.policies)
(class in garage.tf.policies.gaussian_lstm_policy)
GaussianMLPBaseline (class in garage.tf.baselines)
(class in garage.tf.baselines.gaussian_mlp_baseline)
GaussianMLPBaseModule (class in garage.torch.modules.gaussian_mlp_module)
GaussianMLPEncoder (class in garage.tf.embeddings)
(class in garage.tf.embeddings.gaussian_mlp_encoder)
GaussianMLPIndependentStdModule (class in garage.torch.modules)
(class in garage.torch.modules.gaussian_mlp_module)
GaussianMLPModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_mlp_model)
GaussianMLPModule (class in garage.torch.modules)
(class in garage.torch.modules.gaussian_mlp_module)
GaussianMLPPolicy (class in garage.tf.policies)
(class in garage.tf.policies.gaussian_mlp_policy)
(class in garage.torch.policies)
(class in garage.torch.policies.gaussian_mlp_policy)
GaussianMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.gaussian_mlp_regressor)
GaussianMLPRegressorModel (class in garage.tf.regressors.gaussian_mlp_regressor_model)
GaussianMLPTaskEmbeddingPolicy (class in garage.tf.policies)
(class in garage.tf.policies.gaussian_mlp_task_embedding_policy)
GaussianMLPTwoHeadedModule (class in garage.torch.modules)
(class in garage.torch.modules.gaussian_mlp_module)
GaussianMLPValueFunction (class in garage.torch.value_functions)
(class in garage.torch.value_functions.gaussian_mlp_value_function)
get() (LazyDict method)
get_action() (AddGaussianNoise method)
,
[1]
(AddOrnsteinUhlenbeckNoise method)
,
[1]
(CategoricalCNNPolicy method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(ContextConditionedPolicy method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(DeterministicMLPPolicy method)
,
[1]
(DiscreteQfDerivedPolicy method)
,
[1]
(EpsilonGreedyPolicy method)
,
[1]
(ExplorationPolicy method)
,
[1]
(FixedPolicy method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
(GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(NoResetPolicy method)
(Policy method)
,
[1]
,
[2]
,
[3]
,
[4]
,
[5]
(RL2AdaptedPolicy method)
(ScriptedPolicy method)
,
[1]
(StochasticPolicy method)
(TaskEmbeddingPolicy method)
,
[1]
(UniformControlPolicy method)
get_action_given_latent() (GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(TaskEmbeddingPolicy method)
,
[1]
get_action_given_task() (GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(TaskEmbeddingPolicy method)
,
[1]
get_action_sym() (ContinuousMLPPolicy method)
,
[1]
get_actions() (AddGaussianNoise method)
,
[1]
(AddOrnsteinUhlenbeckNoise method)
,
[1]
(CategoricalCNNPolicy method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(DeterministicMLPPolicy method)
,
[1]
(DiscreteQfDerivedPolicy method)
,
[1]
(EpsilonGreedyPolicy method)
,
[1]
(ExplorationPolicy method)
,
[1]
(FixedPolicy method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
(GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(Policy method)
,
[1]
,
[2]
,
[3]
(ScriptedPolicy method)
,
[1]
(StochasticPolicy method)
(TaskEmbeddingPolicy method)
,
[1]
(UniformControlPolicy method)
get_actions_given_latents() (GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(TaskEmbeddingPolicy method)
,
[1]
get_actions_given_tasks() (GaussianMLPTaskEmbeddingPolicy method)
,
[1]
(TaskEmbeddingPolicy method)
,
[1]
get_encoder_spec() (garage.tf.algos.te_npo.TENPO class method)
(garage.tf.algos.TENPO class method)
get_env_copy() (LocalRunner method)
,
[1]
get_env_spec() (garage.torch.algos.PEARL class method)
(garage.torch.algos.pearl.PEARL class method)
get_exploration_policy() (MAML method)
(MetaRLAlgorithm method)
,
[1]
(PEARL method)
,
[1]
(RL2 method)
,
[1]
get_global_vars() (Module method)
,
[1]
(QFunction method)
,
[1]
(TaskEmbeddingPolicy method)
,
[1]
get_history_list() (ISSampler method)
,
[1]
get_infer_spec() (garage.tf.algos.te_npo.TENPO class method)
(garage.tf.algos.TENPO class method)
get_latent() (Encoder method)
,
[1]
(GaussianMLPEncoder method)
,
[1]
(TaskEmbeddingPolicy method)
,
[1]
get_latents() (Encoder method)
,
[1]
(GaussianMLPEncoder method)
,
[1]
get_metadata() (in module garage.experiment.experiment)
get_minibatch() (OptimizerWrapper method)
,
[1]
get_param_shapes() (Module method)
,
[1]
get_param_values() (Baseline method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(ExplorationPolicy method)
,
[1]
(FixedPolicy method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(Module method)
,
[1]
(NoResetPolicy method)
(Policy method)
,
[1]
(RL2AdaptedPolicy method)
(ScriptedPolicy method)
,
[1]
(ZeroBaseline method)
,
[1]
get_params() (Module method)
,
[1]
get_params_internal() (ContinuousMLPBaseline method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
get_plotters() (Plotter static method)
,
[1]
,
[2]
,
[3]
get_possible_next_states() (GridWorldEnv method)
,
[1]
get_qval() (ContinuousCNNQFunction method)
,
[1]
(ContinuousMLPQFunction method)
,
[1]
get_qval_sym() (ContinuousCNNQFunction method)
,
[1]
(ContinuousMLPQFunction method)
,
[1]
(DiscreteCNNQFunction method)
,
[1]
(DiscreteMLPQFunction method)
,
[1]
(QFunction method)
,
[1]
get_regularizable_vars() (CategoricalMLPPolicy method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(QFunction method)
,
[1]
get_seed() (in module garage.experiment.deterministic)
get_target_ops() (in module garage.tf.misc.tensor_utils)
get_trainable_vars() (Module method)
,
[1]
(QFunction method)
,
[1]
(TaskEmbeddingPolicy method)
,
[1]
global_device() (in module garage.torch)
graph_inputs() (in module garage.tf.misc.tensor_utils)
Grayscale (class in garage.envs.wrappers)
(class in garage.envs.wrappers.grayscale)
GridWorldEnv (class in garage.envs)
(class in garage.envs.grid_world_env)
grow_pool() (EnvPoolSampler method)
gru() (in module garage.tf.models.gru)
GRUModel (class in garage.tf.models)
(class in garage.tf.models.gru_model)
H
HalfCheetahDirEnv (class in garage.envs.mujoco)
(class in garage.envs.mujoco.half_cheetah_dir_env)
HalfCheetahEnvMetaBase (class in garage.envs.mujoco.half_cheetah_env_meta_base)
HalfCheetahVelEnv (class in garage.envs.mujoco)
(class in garage.envs.mujoco.half_cheetah_vel_env)
HERReplayBuffer (class in garage.replay_buffer)
(class in garage.replay_buffer.her_replay_buffer)
HessianVectorProduct (class in garage.tf.optimizers.conjugate_gradient_optimizer)
history (ISSampler attribute)
,
[1]
I
icdf() (TanhNormal method)
,
[1]
identity_function() (in module garage.sampler.worker_factory)
infer_posterior() (ContextConditionedPolicy method)
,
[1]
init_opt() (DDPG method)
,
[1]
(DQN method)
,
[1]
(NOP method)
,
[1]
(NPO method)
,
[1]
(REPS method)
,
[1]
(TD3 method)
,
[1]
(TENPO method)
,
[1]
init_plot() (Plotter method)
,
[1]
init_worker() (Plotter method)
,
[1]
initialize() (in module garage.sampler.parallel_sampler)
(StatefulPool method)
initialize_tf_vars() (LocalTFRunner method)
,
[1]
InOutSpec (class in garage)
input (DiscreteCNNQFunction attribute)
,
[1]
(DiscreteMLPQFunction attribute)
,
[1]
(GaussianMLPEncoder attribute)
,
[1]
(Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
input_dim (CategoricalCNNPolicy attribute)
,
[1]
(CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(CategoricalMLPPolicy attribute)
,
[1]
(ContinuousMLPPolicy attribute)
,
[1]
(Encoder attribute)
,
[1]
(GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(GaussianMLPEncoder attribute)
,
[1]
(GaussianMLPPolicy attribute)
,
[1]
(MLPEncoder attribute)
,
[1]
input_space (InOutSpec attribute)
inputs (ContinuousCNNQFunction attribute)
,
[1]
(ContinuousMLPQFunction attribute)
,
[1]
(Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
ISSampler (class in garage.sampler)
(class in garage.sampler.is_sampler)
iterate() (BatchDataset method)
,
[1]
K
kl() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
kl_sym() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
L
last_observations (TrajectoryBatch attribute)
latent_mean (GaussianMLPEncoder attribute)
,
[1]
latent_space (TaskEmbeddingPolicy attribute)
,
[1]
latent_std_param (GaussianMLPEncoder attribute)
,
[1]
launch() (DmControlViewer method)
,
[1]
LazyDict (class in garage.tf.optimizers.utils)
LbfgsOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.lbfgs_optimizer)
lengths (TrajectoryBatch attribute)
likelihood_ratio_sym() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
LinearFeatureBaseline (class in garage.np.baselines)
(class in garage.np.baselines.linear_feature_baseline)
LinearMultiFeatureBaseline (class in garage.np.baselines)
(class in garage.np.baselines.linear_multi_feature_baseline)
load() (Snapshotter method)
,
[1]
LocalRunner (class in garage.experiment)
(class in garage.experiment.local_runner)
LocalSampler (class in garage.sampler)
(class in garage.sampler.local_sampler)
LocalTFRunner (class in garage.experiment)
(class in garage.experiment.local_tf_runner)
log_diagnostics() (Baseline method)
,
[1]
(GridWorldEnv method)
,
[1]
(LocalRunner method)
,
[1]
(NPO method)
,
[1]
(Policy method)
,
[1]
,
[2]
,
[3]
(QFunction method)
,
[1]
(REPS method)
,
[1]
log_likelihood() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
log_likelihood_sym() (Bernoulli method)
,
[1]
(BernoulliMLPRegressor method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(RecurrentCategorical method)
,
[1]
(StochasticRegressor method)
,
[1]
log_multitask_performance() (in module garage)
log_parameters() (in module garage.experiment.experiment_wrapper)
log_performance() (in module garage)
(MAML method)
log_prob() (TanhNormal method)
,
[1]
LogEncoder (class in garage.experiment.experiment)
loss() (ConjugateGradientOptimizer method)
,
[1]
(FirstOrderOptimizer method)
,
[1]
(LbfgsOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
lstm() (in module garage.tf.models.lstm)
LSTMModel (class in garage.tf.models)
(class in garage.tf.models.lstm_model)
M
make_launcher_archive() (in module garage.experiment.experiment)
make_optimizer() (in module garage)
make_sampler() (LocalRunner method)
,
[1]
(LocalTFRunner method)
,
[1]
MAML (class in garage.torch.algos.maml)
MAMLPPO (class in garage.torch.algos)
(class in garage.torch.algos.maml_ppo)
MAMLTrajectoryBatch (class in garage.torch.algos.maml)
MAMLTRPO (class in garage.torch.algos)
(class in garage.torch.algos.maml_trpo)
MAMLVPG (class in garage.torch.algos)
(class in garage.torch.algos.maml_vpg)
max_path_length (RL2 attribute)
,
[1]
MaxAndSkip (class in garage.envs.wrappers)
(class in garage.envs.wrappers.max_and_skip)
mean (TanhNormal attribute)
,
[1]
MetaEvaluator (class in garage.experiment)
(class in garage.experiment.meta_evaluator)
MetaRLAlgorithm (class in garage.np.algos)
(class in garage.np.algos.meta_rl_algorithm)
mlp() (in module garage.tf.models.mlp)
MLPDuelingModel (class in garage.tf.models)
(class in garage.tf.models.mlp_dueling_model)
MLPEncoder (class in garage.torch.embeddings)
(class in garage.torch.embeddings.mlp_encoder)
MLPMergeModel (class in garage.tf.models)
(class in garage.tf.models.mlp_merge_model)
MLPModel (class in garage.tf.models)
(class in garage.tf.models.mlp_model)
MLPModule (class in garage.torch.modules)
(class in garage.torch.modules.mlp_module)
Model (class in garage.tf.models)
(class in garage.tf.models.model)
Module (class in garage.tf.models)
(class in garage.tf.models.module)
MTSAC (class in garage.torch.algos)
(class in garage.torch.algos.mtsac)
MultiEnvWrapper (class in garage.envs)
(class in garage.envs.multi_env_wrapper)
MultiHeadedMLPModule (class in garage.torch.modules)
(class in garage.torch.modules.multi_headed_mlp_module)
MultiprocessingSampler (class in garage.sampler)
(class in garage.sampler.multiprocessing_sampler)
N
n_tasks (ConstructEnvsSampler attribute)
(EnvPoolSampler attribute)
(SetTaskSampler attribute)
(TaskSampler attribute)
,
[1]
,
[2]
,
[3]
n_transitions_stored (PathBuffer attribute)
,
[1]
(ReplayBuffer attribute)
,
[1]
name (BaseModel attribute)
,
[1]
(Model attribute)
,
[1]
(Module attribute)
,
[1]
(Policy attribute)
,
[1]
Network (class in garage.tf.models.model)
network_input_spec() (CNNMLPMergeModel method)
,
[1]
(GRUModel method)
,
[1]
(GaussianGRUModel method)
,
[1]
(GaussianLSTMModel method)
,
[1]
(LSTMModel method)
,
[1]
(MLPMergeModel method)
,
[1]
(Model method)
,
[1]
network_output_spec() (CategoricalCNNModel method)
,
[1]
(CategoricalGRUModel method)
,
[1]
(CategoricalLSTMModel method)
,
[1]
(CategoricalMLPModel method)
,
[1]
(CategoricalMLPRegressorModel method)
(GRUModel method)
,
[1]
(GaussianCNNModel method)
,
[1]
(GaussianCNNRegressorModel method)
,
[1]
(GaussianGRUModel method)
,
[1]
(GaussianLSTMModel method)
,
[1]
(GaussianMLPModel method)
,
[1]
(GaussianMLPRegressorModel method)
(LSTMModel method)
,
[1]
(Model method)
,
[1]
(NormalizedInputMLPModel method)
,
[1]
networks (ContextConditionedPolicy attribute)
,
[1]
(PEARL attribute)
,
[1]
(SAC attribute)
,
[1]
new_tensor() (in module garage.tf.misc.tensor_utils)
new_tensor_like() (in module garage.tf.misc.tensor_utils)
NewEnvUpdate (class in garage.sampler.env_update)
next_observation (TimeStepBatch attribute)
Noop (class in garage.envs.wrappers)
(class in garage.envs.wrappers.noop)
NOP (class in garage.np.algos)
(class in garage.np.algos.nop)
NoResetPolicy (class in garage.tf.algos.rl2)
normalize (in module garage.envs)
(in module garage.envs.normalized_env)
normalize_pixel_batch() (in module garage.misc.tensor_utils)
NormalizedEnv (class in garage.envs.normalized_env)
NormalizedInputMLPModel (class in garage.tf.models)
(class in garage.tf.models.normalized_input_mlp_model)
NotAFileError
NotSetupError
NPO (class in garage.tf.algos)
(class in garage.tf.algos.npo)
num_envs (ParallelVecEnvExecutor attribute)
,
[1]
(VecEnvExecutor attribute)
,
[1]
num_tasks (MultiEnvWrapper attribute)
,
[1]
number_batches (BatchDataset attribute)
,
[1]
O
observation (TimeStep attribute)
observation_space (DmControlEnv attribute)
,
[1]
(EnvSpec attribute)
,
[1]
(Grayscale attribute)
,
[1]
(GridWorldEnv attribute)
,
[1]
(MultiEnvWrapper attribute)
,
[1]
(ParallelVecEnvExecutor attribute)
,
[1]
(PointEnv attribute)
,
[1]
,
[2]
,
[3]
(Policy attribute)
,
[1]
,
[2]
,
[3]
,
[4]
,
[5]
(Resize attribute)
,
[1]
(StackFrames attribute)
,
[1]
(VecEnvExecutor attribute)
,
[1]
observations (MAMLTrajectoryBatch attribute)
(TimeStepBatch attribute)
(TrajectoryBatch attribute)
obtain_evaluation_samples() (in module garage.np)
obtain_exact_trajectories() (LocalSampler method)
,
[1]
(MultiprocessingSampler method)
,
[1]
(RaySampler method)
,
[1]
obtain_samples() (BatchSampler method)
,
[1]
,
[2]
,
[3]
(ISSampler method)
,
[1]
(LocalRunner method)
,
[1]
(LocalSampler method)
,
[1]
(MultiprocessingSampler method)
,
[1]
(OffPolicyVectorizedSampler method)
,
[1]
(OnPolicyVectorizedSampler method)
,
[1]
(RaySampler method)
,
[1]
(Sampler method)
,
[1]
,
[2]
OffPolicyVectorizedSampler (class in garage.sampler)
(class in garage.sampler.off_policy_vectorized_sampler)
OnPolicyVectorizedSampler (class in garage.sampler)
(class in garage.sampler.on_policy_vectorized_sampler)
optimize() (ConjugateGradientOptimizer method)
,
[1]
(FirstOrderOptimizer method)
,
[1]
(LbfgsOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
optimize_policy() (DDPG method)
,
[1]
,
[2]
,
[3]
(DQN method)
,
[1]
(NOP method)
,
[1]
(NPO method)
,
[1]
(REPS method)
,
[1]
(SAC method)
,
[1]
(TD3 method)
,
[1]
(TENPO method)
,
[1]
OptimizerWrapper (class in garage.torch.optimizers)
(class in garage.torch.optimizers.optimizer_wrapper)
output (Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
output_dim (Encoder attribute)
,
[1]
(GaussianMLPEncoder attribute)
,
[1]
(MLPEncoder attribute)
,
[1]
(MLPModule attribute)
,
[1]
output_space (InOutSpec attribute)
outputs (Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
P
pad_tensor() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
pad_tensor_dict() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
pad_tensor_n() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
pad_to_last() (in module garage.torch)
ParallelVecEnvExecutor (class in garage.sampler)
(class in garage.sampler.parallel_vec_env_executor)
parameter() (in module garage.tf.models.parameter)
parameters (BaseModel attribute)
,
[1]
(Model attribute)
,
[1]
PathBuffer (class in garage.replay_buffer)
(class in garage.replay_buffer.path_buffer)
paths (MAMLTrajectoryBatch attribute)
paths_to_tensors() (in module garage.np)
(TENPO method)
,
[1]
(in module garage.tf)
PEARL (class in garage.torch.algos)
(class in garage.torch.algos.pearl)
PearlmutterHvp (class in garage.tf.optimizers.conjugate_gradient_optimizer)
PEARLWorker (class in garage.torch.algos.pearl)
PenaltyLbfgsOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.penalty_lbfgs_optimizer)
Plotter (class in garage.plotter)
(class in garage.plotter.plotter)
(class in garage.tf.plotter)
(class in garage.tf.plotter.plotter)
PointEnv (class in garage.envs)
(class in garage.envs.point_env)
Policy (class in garage.np.policies)
(class in garage.np.policies.policy)
(class in garage.tf.policies)
(class in garage.tf.policies.policy)
(class in garage.torch.policies)
(class in garage.torch.policies.policy)
policy (MAML attribute)
(PEARL attribute)
,
[1]
(RL2 attribute)
,
[1]
populate_task() (in module garage.sampler.parallel_sampler)
positive_advs() (in module garage.tf.misc.tensor_utils)
PPO (class in garage.tf.algos)
(class in garage.tf.algos.ppo)
(class in garage.torch.algos)
(class in garage.torch.algos.ppo)
predict() (Baseline method)
,
[1]
(BernoulliMLPRegressor method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(ContinuousMLPRegressor method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(GaussianMLPRegressor method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(Regressor method)
,
[1]
(ZeroBaseline method)
,
[1]
predict_log_likelihood() (BernoulliMLPRegressor method)
,
[1]
predict_n() (ZeroBaseline method)
,
[1]
predict_sym() (ContinuousMLPRegressor method)
,
[1]
prepare_worker_messages() (WorkerFactory method)
,
[1]
process_samples() (VPG method)
,
[1]
product_of_gaussians() (in module garage.torch)
Q
q_vals (DiscreteCNNQFunction attribute)
,
[1]
(DiscreteMLPQFunction attribute)
,
[1]
QFunction (class in garage.np.q_functions)
(class in garage.np.q_functions.q_function)
(class in garage.tf.q_functions)
(class in garage.tf.q_functions.q_function)
R
RaySampler (class in garage.sampler)
(class in garage.sampler.ray_sampler)
recurrent (BernoulliMLPRegressor attribute)
,
[1]
(CategoricalMLPRegressor attribute)
,
[1]
(ContinuousMLPRegressor attribute)
,
[1]
(GaussianCNNRegressor attribute)
,
[1]
recurrent_parameter() (in module garage.tf.models.parameter)
RecurrentCategorical (class in garage.tf.distributions)
(class in garage.tf.distributions.recurrent_categorical)
RecurrentDiagonalGaussian (in module garage.tf.distributions)
Regressor (class in garage.tf.regressors)
(class in garage.tf.regressors.regressor)
render() (DmControlEnv method)
,
[1]
(DmControlViewer method)
,
[1]
(GridWorldEnv method)
,
[1]
(PointEnv method)
,
[1]
ReplayBuffer (class in garage.replay_buffer)
(class in garage.replay_buffer.replay_buffer)
REPS (class in garage.tf.algos)
(class in garage.tf.algos.reps)
reset() (AddGaussianNoise method)
,
[1]
(AddOrnsteinUhlenbeckNoise method)
,
[1]
(AtariEnv method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(ClipReward method)
,
[1]
(DmControlEnv method)
,
[1]
(Encoder method)
,
[1]
(EpisodicLife method)
,
[1]
(ExplorationPolicy method)
,
[1]
(FireReset method)
,
[1]
(FixedPolicy method)
,
[1]
(GarageEnv method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(Grayscale method)
,
[1]
(GridWorldEnv method)
,
[1]
(MLPEncoder method)
,
[1]
(MaxAndSkip method)
,
[1]
(Module method)
,
[1]
(MultiEnvWrapper method)
,
[1]
(NoResetPolicy method)
(Noop method)
,
[1]
(NormalizedEnv method)
(ParallelVecEnvExecutor method)
,
[1]
(PointEnv method)
,
[1]
(Policy method)
,
[1]
,
[2]
,
[3]
(RL2AdaptedPolicy method)
(RL2Env method)
(Resize method)
,
[1]
(ScriptedPolicy method)
,
[1]
(StackFrames method)
,
[1]
(TaskOnehotWrapper method)
,
[1]
(VecEnvExecutor method)
,
[1]
reset_belief() (ContextConditionedPolicy method)
,
[1]
Resize (class in garage.envs.wrappers)
(class in garage.envs.wrappers.resize)
restore() (LocalRunner method)
,
[1]
resume() (LocalRunner method)
,
[1]
reward (TimeStep attribute)
rewards (MAMLTrajectoryBatch attribute)
(TimeStepBatch attribute)
(TrajectoryBatch attribute)
RL2 (class in garage.tf.algos)
(class in garage.tf.algos.rl2)
RL2AdaptedPolicy (class in garage.tf.algos.rl2)
RL2Env (class in garage.tf.algos.rl2)
RL2PPO (class in garage.tf.algos)
(class in garage.tf.algos.rl2ppo)
RL2TRPO (class in garage.tf.algos)
(class in garage.tf.algos.rl2trpo)
RL2Worker (class in garage.tf.algos.rl2)
RLAlgorithm (class in garage.np.algos)
(class in garage.np.algos.rl_algorithm)
rollout() (DefaultWorker method)
,
[1]
(PEARLWorker method)
(RL2Worker method)
(SamplerWorker method)
(TFWorkerWrapper method)
,
[1]
(Worker method)
,
[1]
(in module garage.sampler.utils)
round_robin_strategy() (in module garage.envs.multi_env_wrapper)
rrse() (in module garage.misc.tensor_utils)
rsample() (TanhNormal method)
,
[1]
rsample_with_pre_tanh_value() (TanhNormal method)
,
[1]
run_collect() (StatefulPool method)
run_each() (StatefulPool method)
run_experiment() (in module garage.experiment)
(in module garage.experiment.experiment)
(in module garage.experiment.experiment_wrapper)
run_imap_unordered() (StatefulPool method)
run_map() (StatefulPool method)
run_worker() (in module garage.sampler.multiprocessing_sampler)
S
SAC (class in garage.torch.algos)
(class in garage.torch.algos.sac)
sample() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(ConstructEnvsSampler method)
(DiagonalGaussian method)
,
[1]
(EnvPoolSampler method)
(ReplayBuffer method)
,
[1]
(SetTaskSampler method)
(TanhNormal method)
,
[1]
(TaskSampler method)
,
[1]
sample_from_belief() (ContextConditionedPolicy method)
,
[1]
sample_path() (PathBuffer method)
,
[1]
sample_paths() (in module garage.sampler.parallel_sampler)
sample_predict() (BernoulliMLPRegressor method)
,
[1]
sample_sym() (Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
sample_tasks() (HalfCheetahDirEnv method)
,
[1]
(HalfCheetahVelEnv method)
,
[1]
(PointEnv method)
,
[1]
sample_transitions() (PathBuffer method)
,
[1]
Sampler (class in garage.sampler)
(class in garage.sampler.sampler)
(class in garage.sampler.sampler_deprecated)
SamplerWorker (class in garage.sampler.ray_sampler)
samples_to_tensors() (in module garage.np)
save() (LocalRunner method)
,
[1]
save_itr_params() (Snapshotter method)
,
[1]
ScriptedPolicy (class in garage.np.policies)
(class in garage.np.policies.scripted_policy)
Sequential (class in garage.tf.models)
(class in garage.tf.models.sequential)
set() (LazyDict method)
set_gpu_mode() (in module garage.torch)
set_param_values() (Baseline method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(ExplorationPolicy method)
,
[1]
(FixedPolicy method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(Module method)
,
[1]
(NoResetPolicy method)
(Policy method)
,
[1]
(RL2AdaptedPolicy method)
(ScriptedPolicy method)
,
[1]
(ZeroBaseline method)
,
[1]
set_seed() (in module garage.experiment.deterministic)
(in module garage.sampler.parallel_sampler)
set_task() (HalfCheetahDirEnv method)
,
[1]
(HalfCheetahVelEnv method)
,
[1]
(PointEnv method)
,
[1]
SetTaskSampler (class in garage.experiment.task_sampler)
SetTaskUpdate (class in garage.sampler.env_update)
setup() (LocalRunner method)
,
[1]
(LocalTFRunner method)
,
[1]
SetupArgs (class in garage.experiment.local_runner)
SharedGlobal (class in garage.sampler.stateful_pool)
shutdown() (DefaultWorker method)
,
[1]
(SamplerWorker method)
(TFWorkerWrapper method)
,
[1]
(VecWorker method)
,
[1]
(Worker method)
,
[1]
shutdown_worker() (BatchSampler method)
,
[1]
,
[2]
,
[3]
(LocalSampler method)
,
[1]
(MultiprocessingSampler method)
,
[1]
(OffPolicyVectorizedSampler method)
,
[1]
(OnPolicyVectorizedSampler method)
,
[1]
(RaySampler method)
,
[1]
(Sampler method)
,
[1]
,
[2]
slice_nested_dict() (in module garage.misc.tensor_utils)
sliced_fun() (in module garage.tf.optimizers.utils)
sliding_window() (in module garage.misc.tensor_utils)
snapshot_dir (SnapshotConfig attribute)
,
[1]
(Snapshotter attribute)
,
[1]
snapshot_gap (SnapshotConfig attribute)
,
[1]
(Snapshotter attribute)
,
[1]
snapshot_mode (SnapshotConfig attribute)
,
[1]
(Snapshotter attribute)
,
[1]
SnapshotConfig (class in garage.experiment)
(class in garage.experiment.snapshotter)
Snapshotter (class in garage.experiment)
(class in garage.experiment.snapshotter)
spec (Encoder attribute)
,
[1]
(GarageEnv attribute)
,
[1]
(GaussianMLPEncoder attribute)
,
[1]
(MLPEncoder attribute)
,
[1]
(MultiEnvWrapper attribute)
,
[1]
(RL2Env attribute)
(TaskOnehotWrapper attribute)
,
[1]
split() (TimeStepBatch method)
(TrajectoryBatch method)
split_augmented_observation() (TaskEmbeddingPolicy method)
,
[1]
split_tensor_dict_list() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
stack_and_pad_tensor_dict_list() (in module garage.misc.tensor_utils)
stack_tensor_dict_list() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
StackFrames (class in garage.envs.wrappers)
(class in garage.envs.wrappers.stack_frames)
start() (Plotter method)
,
[1]
start_rollout() (DefaultWorker method)
,
[1]
(PEARLWorker method)
(RL2Worker method)
(TFWorkerWrapper method)
,
[1]
(TaskEmbeddingWorker method)
(VecWorker method)
,
[1]
(Worker method)
,
[1]
start_worker() (BatchSampler method)
,
[1]
,
[2]
,
[3]
(OffPolicyVectorizedSampler method)
,
[1]
(OnPolicyVectorizedSampler method)
,
[1]
(RaySampler method)
,
[1]
(Sampler method)
,
[1]
,
[2]
state (ConjugateGradientOptimizer attribute)
,
[1]
state_info_keys (Module attribute)
,
[1]
(Policy attribute)
,
[1]
state_info_specs (CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(Module attribute)
,
[1]
StatefulPool (class in garage.sampler.stateful_pool)
step() (AtariEnv method)
,
[1]
(ClipReward method)
,
[1]
(ConjugateGradientOptimizer method)
,
[1]
(DifferentiableSGD method)
,
[1]
(DmControlEnv method)
,
[1]
(EpisodicLife method)
,
[1]
(FireReset method)
,
[1]
(GarageEnv method)
,
[1]
(Grayscale method)
,
[1]
(GridWorldEnv method)
,
[1]
(HalfCheetahDirEnv method)
,
[1]
(HalfCheetahVelEnv method)
,
[1]
Step() (in module garage.envs)
(in module garage.envs.step)
step() (MaxAndSkip method)
,
[1]
(MultiEnvWrapper method)
,
[1]
(Noop method)
,
[1]
(NormalizedEnv method)
(OptimizerWrapper method)
,
[1]
(ParallelVecEnvExecutor method)
,
[1]
(PointEnv method)
,
[1]
(RL2Env method)
(Resize method)
,
[1]
(StackFrames method)
,
[1]
(TaskOnehotWrapper method)
,
[1]
(VecEnvExecutor method)
,
[1]
step_epochs() (LocalRunner method)
,
[1]
step_rollout() (DefaultWorker method)
,
[1]
(PEARLWorker method)
(TFWorkerWrapper method)
,
[1]
(TaskEmbeddingWorker method)
(VecWorker method)
,
[1]
(Worker method)
,
[1]
StochasticEncoder (class in garage.np.embeddings)
(class in garage.np.embeddings.encoder)
(class in garage.tf.embeddings)
(class in garage.tf.embeddings.encoder)
StochasticModule (class in garage.tf.models)
(class in garage.tf.models.module)
StochasticPolicy (class in garage.np.policies)
(class in garage.np.policies.policy)
(class in garage.tf.policies)
(class in garage.tf.policies.policy)
(class in garage.torch.policies.stochastic_policy)
StochasticRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.regressor)
store_episode() (ReplayBuffer method)
,
[1]
T
TanhGaussianMLPPolicy (class in garage.torch.policies)
(class in garage.torch.policies.tanh_gaussian_mlp_policy)
TanhNormal (class in garage.torch.distributions)
(class in garage.torch.distributions.tanh_normal)
task_space (MultiEnvWrapper attribute)
,
[1]
(TaskEmbeddingPolicy attribute)
,
[1]
TaskEmbeddingPolicy (class in garage.tf.policies)
(class in garage.tf.policies.task_embedding_policy)
TaskEmbeddingWorker (class in garage.tf.algos.te)
TaskOnehotWrapper (class in garage.envs)
(class in garage.envs.task_onehot_wrapper)
TaskSampler (class in garage.experiment)
(class in garage.experiment.task_sampler)
TD3 (class in garage.tf.algos)
(class in garage.tf.algos.td3)
TENPO (class in garage.tf.algos)
(class in garage.tf.algos.te_npo)
TEPPO (class in garage.tf.algos)
(class in garage.tf.algos.te_ppo)
terminals (TimeStep attribute)
(TimeStepBatch attribute)
(TrajectoryBatch attribute)
terminate() (Module method)
,
[1]
(Policy method)
,
[1]
terminate_task() (in module garage.sampler.parallel_sampler)
TFWorkerClassWrapper (class in garage.tf.samplers)
(class in garage.tf.samplers.worker)
TFWorkerWrapper (class in garage.tf.samplers)
(class in garage.tf.samplers.worker)
TimeStep (class in garage)
TimeStepBatch (class in garage)
TNPG (class in garage.tf.algos)
(class in garage.tf.algos.tnpg)
to() (GaussianMLPBaseModule method)
(MTSAC method)
,
[1]
(PEARL method)
,
[1]
(SAC method)
,
[1]
to_local_command() (in module garage.experiment)
(in module garage.experiment.experiment)
to_time_step_list() (TimeStepBatch method)
to_trajectory_list() (TrajectoryBatch method)
torch_to_np() (in module garage.torch)
total_env_steps (LocalRunner attribute)
,
[1]
train() (CEM method)
,
[1]
(CMAES method)
,
[1]
(DDPG method)
,
[1]
,
[2]
,
[3]
(DQN method)
,
[1]
(LocalRunner method)
,
[1]
(MAML method)
(NOP method)
,
[1]
(NPO method)
,
[1]
(PEARL method)
,
[1]
(REPS method)
,
[1]
(RL2 method)
,
[1]
(RLAlgorithm method)
,
[1]
(SAC method)
,
[1]
(TD3 method)
,
[1]
(TENPO method)
,
[1]
(VPG method)
,
[1]
train_once() (CEM method)
,
[1]
(CMAES method)
,
[1]
(DDPG method)
,
[1]
,
[2]
,
[3]
(DQN method)
,
[1]
(MAML method)
(NPO method)
,
[1]
(REPS method)
,
[1]
(RL2 method)
,
[1]
(SAC method)
,
[1]
(TD3 method)
,
[1]
(TENPO method)
,
[1]
(VPG method)
,
[1]
TrainArgs (class in garage.experiment.local_runner)
TrajectoryBatch (class in garage)
TRPO (class in garage.tf.algos)
(class in garage.tf.algos.trpo)
(class in garage.torch.algos)
(class in garage.torch.algos.trpo)
truncate_paths() (in module garage.sampler.utils)
truncate_tensor_dict() (in module garage.misc.tensor_utils)
U
unflatten_tensors() (in module garage.misc.tensor_utils)
uniform_random_strategy() (in module garage.envs.multi_env_wrapper)
UniformControlPolicy (class in garage.tf.policies.uniform_control_policy)
update() (BatchDataset method)
,
[1]
(SamplerWorker method)
update_agent() (DefaultWorker method)
,
[1]
(TFWorkerWrapper method)
,
[1]
(VecWorker method)
,
[1]
(Worker method)
,
[1]
update_context() (ContextConditionedPolicy method)
,
[1]
update_env() (DefaultWorker method)
,
[1]
(TFWorkerWrapper method)
,
[1]
(VecWorker method)
,
[1]
(Worker method)
,
[1]
update_hvp() (FiniteDifferenceHvp method)
,
[1]
(HessianVectorProduct method)
(PearlmutterHvp method)
update_module_params() (in module garage.torch)
update_opt() (ConjugateGradientOptimizer method)
,
[1]
(FirstOrderOptimizer method)
,
[1]
(LbfgsOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
update_plot() (Plotter method)
,
[1]
,
[2]
,
[3]
update_target() (DDPG method)
,
[1]
V
valids (MAMLTrajectoryBatch attribute)
ValueFunction (class in garage.torch.value_functions)
(class in garage.torch.value_functions.value_function)
variance (TanhNormal attribute)
,
[1]
VecEnvExecutor (class in garage.sampler)
(class in garage.sampler.vec_env_executor)
vectorized (BernoulliMLPRegressor attribute)
,
[1]
(CategoricalCNNPolicy attribute)
,
[1]
(CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(CategoricalMLPPolicy attribute)
,
[1]
(CategoricalMLPRegressor attribute)
,
[1]
(ContinuousMLPPolicy attribute)
,
[1]
(ContinuousMLPRegressor attribute)
,
[1]
(DiscreteQfDerivedPolicy attribute)
,
[1]
(GaussianCNNRegressor attribute)
,
[1]
(GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(GaussianMLPEncoder attribute)
,
[1]
(GaussianMLPPolicy attribute)
,
[1]
(GaussianMLPRegressor attribute)
,
[1]
(Module attribute)
,
[1]
(Policy attribute)
,
[1]
(UniformControlPolicy attribute)
VecWorker (class in garage.sampler)
(class in garage.sampler.vec_worker)
viewer_setup() (HalfCheetahEnvMetaBase method)
visualize_distribution() (TENPO method)
,
[1]
VPG (class in garage.tf.algos)
(class in garage.tf.algos.vpg)
(class in garage.torch.algos)
(class in garage.torch.algos.vpg)
W
Worker (class in garage.sampler)
(class in garage.sampler.worker)
worker_init() (DefaultWorker method)
,
[1]
(TFWorkerWrapper method)
,
[1]
worker_init_envs() (in module garage.sampler.parallel_vec_env_executor)
worker_init_tf() (in module garage.tf.samplers.batch_sampler)
worker_init_tf_vars() (in module garage.tf.samplers.batch_sampler)
worker_run_reset() (in module garage.sampler.parallel_vec_env_executor)
worker_run_step() (in module garage.sampler.parallel_vec_env_executor)
WorkerFactory (class in garage.sampler)
(class in garage.sampler.worker_factory)
wrap_env_cons_list() (garage.envs.task_onehot_wrapper.TaskOnehotWrapper class method)
(garage.envs.TaskOnehotWrapper class method)
wrap_env_list() (garage.envs.task_onehot_wrapper.TaskOnehotWrapper class method)
(garage.envs.TaskOnehotWrapper class method)
wrap_experiment() (in module garage)
(in module garage.experiment.experiment)
Z
zero_grad() (DifferentiableSGD method)
,
[1]
(OptimizerWrapper method)
,
[1]
ZeroBaseline (class in garage.np.baselines)
(class in garage.np.baselines.zero_baseline)
Read the Docs
v: v2020.06.0
Versions
latest
stable
v2020.06.0
v2019.10.1
v2019.10.0
v2019.02.2
v2019.02.1
v2019.02.0
v2018.10.1
v2018.10.0
Downloads
On Read the Docs
Project Home
Builds
Free document hosting provided by
Read the Docs
.