garage
v2019.10.2
Installation
Running Experiments
Implementing New Environments
Implementing New Algorithms (Basic)
Implementing New Algorithms (Advanced)
garage
Docs
»
Index
Edit on GitHub
Index
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
K
|
L
|
M
|
N
|
O
|
P
|
Q
|
R
|
S
|
T
|
U
|
V
|
W
|
Z
A
action_from_direction() (GridWorldEnv static method)
,
[1]
action_space (GridWorldEnv attribute)
,
[1]
(ParallelVecEnvExecutor attribute)
(PointEnv attribute)
,
[1]
,
[2]
,
[3]
(Policy attribute)
,
[1]
,
[2]
,
[3]
,
[4]
,
[5]
(VecEnvExecutor attribute)
active_task_index (MultiEnvWrapper attribute)
active_task_one_hot (MultiEnvWrapper attribute)
add() (VariantGenerator method)
,
[1]
add_history() (ISSampler method)
add_path() (PathBuffer method)
,
[1]
add_transition() (ReplayBuffer method)
add_transitions() (ReplayBuffer method)
algorithm_parallelized (Baseline attribute)
,
[1]
AtariEnv (class in garage.envs.wrappers)
(class in garage.envs.wrappers.atari_env)
AttrDict (class in garage.experiment.experiment)
B
Baseline (class in garage.np.baselines)
(class in garage.np.baselines.base)
BaseModel (class in garage.tf.models.base)
BaseSampler (class in garage.sampler.base)
BatchDataset (class in garage.np.optimizers)
(class in garage.np.optimizers.minibatch_dataset)
BatchSampler (class in garage.sampler.batch_sampler)
Bernoulli (class in garage.tf.distributions)
(class in garage.tf.distributions.bernoulli)
BernoulliMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.bernoulli_mlp_regressor)
build() (BaseModel method)
(Model method)
,
[1]
build_eval() (HessianVectorProduct method)
C
Categorical (class in garage.tf.distributions)
(class in garage.tf.distributions.categorical)
CategoricalCNNPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_cnn_policy)
CategoricalGRUPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_gru_policy)
CategoricalLSTMPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_lstm_policy)
CategoricalMLPPolicy (class in garage.tf.policies)
(class in garage.tf.policies.categorical_mlp_policy)
CategoricalMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.categorical_mlp_regressor)
center_advs() (in module garage.tf.misc.tensor_utils)
cg() (in module garage.tf.optimizers.conjugate_gradient_optimizer)
ClipReward (class in garage.envs.wrappers)
(class in garage.envs.wrappers.clip_reward)
clone() (CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(ContinuousMLPQFunction method)
,
[1]
(DiscreteCNNQFunction method)
,
[1]
(DiscreteMLPQFunction method)
,
[1]
(QFunction method)
,
[1]
close() (DmControlViewer method)
(GarageEnv method)
,
[1]
(MultiEnvWrapper method)
(ParallelVecEnvExecutor method)
(Plotter method)
,
[1]
,
[2]
,
[3]
(StatefulPool method)
(VecEnvExecutor method)
(in module garage.sampler.parallel_sampler)
cnn() (in module garage.tf.models.cnn)
cnn_with_max_pooling() (in module garage.tf.models.cnn)
CNNModel (class in garage.tf.models)
(class in garage.tf.models.cnn_model)
CNNModelWithMaxPooling (class in garage.tf.models)
(class in garage.tf.models.cnn_model_max_pooling)
compile_function() (in module garage.tf.misc.tensor_utils)
compute_advantages() (in module garage.tf.misc.tensor_utils)
concat_tensor_dict_list() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
concat_tensor_list() (in module garage.tf.misc.tensor_utils)
ConjugateGradientOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.conjugate_gradient_optimizer)
constraint_val() (ConjugateGradientOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
ContinuousMLPBaseline (class in garage.tf.baselines)
(class in garage.tf.baselines.continuous_mlp_baseline)
ContinuousMLPPolicy (class in garage.tf.policies)
(class in garage.tf.policies.continuous_mlp_policy)
ContinuousMLPQFunction (class in garage.tf.q_functions)
(class in garage.tf.q_functions.continuous_mlp_q_function)
(class in garage.torch.q_functions)
(class in garage.torch.q_functions.continuous_mlp_q_function)
ContinuousMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.continuous_mlp_regressor)
cross_entropy_sym() (Categorical method)
,
[1]
D
DeterministicMLPPolicy (class in garage.torch.policies)
(class in garage.torch.policies.deterministic_mlp_policy)
DiagonalGaussian (class in garage.tf.distributions)
(class in garage.tf.distributions.diagonal_gaussian)
dim (Bernoulli attribute)
,
[1]
(Categorical attribute)
,
[1]
(DiagonalGaussian attribute)
,
[1]
(Distribution attribute)
,
[1]
(RecurrentCategorical attribute)
,
[1]
disable() (Plotter static method)
,
[1]
,
[2]
,
[3]
discount_cumsum() (in module garage.misc.tensor_utils)
discounted_returns() (in module garage.tf.misc.tensor_utils)
DiscreteCNNQFunction (class in garage.tf.q_functions)
(class in garage.tf.q_functions.discrete_cnn_q_function)
DiscreteMLPQFunction (class in garage.tf.q_functions)
(class in garage.tf.q_functions.discrete_mlp_q_function)
DiscreteQfDerivedPolicy (class in garage.tf.policies)
(class in garage.tf.policies.discrete_qf_derived_policy)
dist_info() (CategoricalCNNPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(StochasticPolicy method)
,
[1]
,
[2]
,
[3]
dist_info_keys (Bernoulli attribute)
,
[1]
(Distribution attribute)
,
[1]
dist_info_specs (Categorical attribute)
,
[1]
(DiagonalGaussian attribute)
,
[1]
(Distribution attribute)
,
[1]
(RecurrentCategorical attribute)
,
[1]
dist_info_sym() (BernoulliMLPRegressor method)
,
[1]
(CategoricalCNNPolicy method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
(GaussianMLPRegressor method)
,
[1]
(StochasticPolicy method)
,
[1]
(StochasticRegressor method)
,
[1]
distribution (CategoricalCNNPolicy attribute)
,
[1]
(CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(CategoricalMLPPolicy attribute)
,
[1]
Distribution (class in garage.tf.distributions)
(class in garage.tf.distributions.base)
distribution (GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(GaussianMLPPolicy attribute)
,
[1]
(StochasticPolicy attribute)
,
[1]
,
[2]
,
[3]
DmControlViewer (class in garage.envs.dm_control.dm_control_viewer)
dump() (VariantDict method)
E
enable (Plotter attribute)
,
[1]
,
[2]
,
[3]
entropy() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
entropy_sym() (Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(RecurrentCategorical method)
,
[1]
env_spec (Policy attribute)
,
[1]
EnvSpec (class in garage.envs)
(class in garage.envs.env_spec)
EpisodicLife (class in garage.envs.wrappers)
(class in garage.envs.wrappers.episodic_life)
EpsilonGreedyStrategy (class in garage.np.exploration_strategies)
(class in garage.np.exploration_strategies.epsilon_greedy_strategy)
Experiment (class in garage.experiment.nb_utils)
ExperimentDatabase (class in garage.experiment.nb_utils)
explained_variance_1d() (in module garage.misc.tensor_utils)
ExplorationStrategy (class in garage.np.exploration_strategies)
(class in garage.np.exploration_strategies.base)
F
filter_experiments() (ExperimentDatabase method)
filter_valids() (in module garage.tf.misc.tensor_utils)
filter_valids_dict() (in module garage.tf.misc.tensor_utils)
FiniteDifferenceHvp (class in garage.tf.optimizers)
(class in garage.tf.optimizers.conjugate_gradient_optimizer)
FireReset (class in garage.envs.wrappers)
(class in garage.envs.wrappers.fire_reset)
FirstOrderOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.first_order_optimizer)
fit() (Baseline method)
,
[1]
(BernoulliMLPRegressor method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(ContinuousMLPRegressor method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(GaussianMLPRegressor method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(ProductRegressor method)
,
[1]
(Regressor method)
,
[1]
(ZeroBaseline method)
,
[1]
flat_to_params() (Policy method)
,
[1]
(Regressor method)
,
[1]
flatten_batch() (in module garage.tf.misc.tensor_utils)
flatten_batch_dict() (in module garage.tf.misc.tensor_utils)
flatten_inputs() (in module garage.tf.misc.tensor_utils)
flatten_tensor_variables() (in module garage.tf.misc.tensor_utils)
flatten_tensors() (in module garage.misc.tensor_utils)
forward() (ContinuousMLPQFunction method)
,
[1]
(DeterministicMLPPolicy method)
,
[1]
(GaussianMLPBaseModule method)
(GaussianMLPPolicy method)
,
[1]
(MLPModule method)
,
[1]
(MultiHeadedMLPModule method)
,
[1]
from_onehot() (in module garage.tf.distributions.categorical)
full (ReplayBuffer attribute)
G
garage (module)
garage.envs (module)
garage.envs.base (module)
garage.envs.dm_control.dm_control_viewer (module)
garage.envs.env_spec (module)
garage.envs.grid_world_env (module)
garage.envs.multi_env_wrapper (module)
garage.envs.normalized_env (module)
garage.envs.point_env (module)
garage.envs.wrappers (module)
garage.envs.wrappers.atari_env (module)
garage.envs.wrappers.clip_reward (module)
garage.envs.wrappers.episodic_life (module)
garage.envs.wrappers.fire_reset (module)
garage.envs.wrappers.grayscale (module)
garage.envs.wrappers.max_and_skip (module)
garage.envs.wrappers.noop (module)
garage.envs.wrappers.resize (module)
garage.envs.wrappers.stack_frames (module)
garage.experiment (module)
garage.experiment.deterministic (module)
garage.experiment.experiment (module)
garage.experiment.local_runner (module)
garage.experiment.nb_utils (module)
garage.experiment.snapshotter (module)
garage.misc (module)
garage.misc.prog_bar_counter (module)
garage.misc.tensor_utils (module)
garage.np (module)
garage.np.algos.base (module)
garage.np.baselines (module)
garage.np.baselines.base (module)
garage.np.baselines.linear_feature_baseline (module)
garage.np.baselines.zero_baseline (module)
garage.np.exploration_strategies (module)
garage.np.exploration_strategies.base (module)
garage.np.exploration_strategies.epsilon_greedy_strategy (module)
garage.np.exploration_strategies.gaussian_strategy (module)
garage.np.exploration_strategies.ou_strategy (module)
garage.np.optimizers (module)
garage.np.optimizers.minibatch_dataset (module)
garage.np.policies (module)
garage.np.policies.base (module)
garage.np.policies.scripted_policy (module)
garage.np.q_functions (module)
garage.np.q_functions.base (module)
garage.np.regressors (module)
garage.np.regressors.product_regressor (module)
garage.plotter (module)
garage.plotter.plotter (module)
garage.replay_buffer (module)
garage.replay_buffer.base (module)
garage.replay_buffer.her_replay_buffer (module)
garage.replay_buffer.path_buffer (module)
garage.replay_buffer.simple_replay_buffer (module)
garage.sampler.base (module)
garage.sampler.batch_sampler (module)
garage.sampler.is_sampler (module)
garage.sampler.off_policy_vectorized_sampler (module)
garage.sampler.on_policy_vectorized_sampler (module)
garage.sampler.parallel_sampler (module)
garage.sampler.parallel_vec_env_executor (module)
garage.sampler.stateful_pool (module)
garage.sampler.utils (module)
garage.sampler.vec_env_executor (module)
garage.tf (module)
garage.tf.baselines (module)
garage.tf.baselines.continuous_mlp_baseline (module)
garage.tf.baselines.gaussian_cnn_baseline (module)
garage.tf.baselines.gaussian_mlp_baseline (module)
garage.tf.distributions (module)
garage.tf.distributions.base (module)
garage.tf.distributions.bernoulli (module)
garage.tf.distributions.categorical (module)
garage.tf.distributions.diagonal_gaussian (module)
garage.tf.distributions.recurrent_categorical (module)
garage.tf.distributions.recurrent_diagonal_gaussian (module)
garage.tf.envs (module)
garage.tf.envs.base (module)
garage.tf.experiment (module)
garage.tf.experiment.local_tf_runner (module)
garage.tf.misc (module)
garage.tf.misc.tensor_utils (module)
garage.tf.models (module)
garage.tf.models.base (module)
garage.tf.models.cnn (module)
garage.tf.models.cnn_model (module)
garage.tf.models.cnn_model_max_pooling (module)
garage.tf.models.gaussian_cnn_model (module)
garage.tf.models.gaussian_gru_model (module)
garage.tf.models.gaussian_lstm_model (module)
garage.tf.models.gaussian_mlp_model (module)
garage.tf.models.gru (module)
garage.tf.models.gru_model (module)
garage.tf.models.lstm (module)
garage.tf.models.lstm_model (module)
garage.tf.models.mlp (module)
garage.tf.models.mlp_dueling_model (module)
garage.tf.models.mlp_merge_model (module)
garage.tf.models.mlp_model (module)
garage.tf.models.normalized_input_mlp_model (module)
garage.tf.models.parameter (module)
garage.tf.models.sequential (module)
garage.tf.optimizers (module)
garage.tf.optimizers.conjugate_gradient_optimizer (module)
garage.tf.optimizers.first_order_optimizer (module)
garage.tf.optimizers.lbfgs_optimizer (module)
garage.tf.optimizers.penalty_lbfgs_optimizer (module)
garage.tf.optimizers.utils (module)
garage.tf.plotter (module)
garage.tf.plotter.plotter (module)
garage.tf.policies (module)
garage.tf.policies.base (module)
garage.tf.policies.categorical_cnn_policy (module)
garage.tf.policies.categorical_gru_policy (module)
garage.tf.policies.categorical_lstm_policy (module)
garage.tf.policies.categorical_mlp_policy (module)
garage.tf.policies.continuous_mlp_policy (module)
garage.tf.policies.discrete_qf_derived_policy (module)
garage.tf.policies.gaussian_gru_policy (module)
garage.tf.policies.gaussian_lstm_policy (module)
garage.tf.policies.gaussian_mlp_policy (module)
garage.tf.policies.uniform_control_policy (module)
garage.tf.q_functions (module)
garage.tf.q_functions.base (module)
garage.tf.q_functions.continuous_mlp_q_function (module)
garage.tf.q_functions.discrete_cnn_q_function (module)
garage.tf.q_functions.discrete_mlp_q_function (module)
garage.tf.regressors (module)
garage.tf.regressors.base (module)
garage.tf.regressors.bernoulli_mlp_regressor (module)
garage.tf.regressors.categorical_mlp_regressor (module)
garage.tf.regressors.continuous_mlp_regressor (module)
garage.tf.regressors.gaussian_cnn_regressor (module)
garage.tf.regressors.gaussian_cnn_regressor_model (module)
garage.tf.regressors.gaussian_mlp_regressor (module)
garage.tf.regressors.gaussian_mlp_regressor_model (module)
garage.torch (module)
garage.torch.modules (module)
garage.torch.modules.gaussian_mlp_module (module)
garage.torch.modules.mlp_module (module)
garage.torch.modules.multi_headed_mlp_module (module)
garage.torch.policies (module)
garage.torch.policies.base (module)
garage.torch.policies.deterministic_mlp_policy (module)
garage.torch.policies.gaussian_mlp_policy (module)
garage.torch.q_functions (module)
garage.torch.q_functions.continuous_mlp_q_function (module)
garage.torch.utils (module)
GarageEnv (class in garage.envs)
(class in garage.envs.base)
GaussianCNNBaseline (class in garage.tf.baselines)
(class in garage.tf.baselines.gaussian_cnn_baseline)
GaussianCNNModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_cnn_model)
GaussianCNNRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.gaussian_cnn_regressor)
GaussianCNNRegressorModel (class in garage.tf.regressors)
(class in garage.tf.regressors.gaussian_cnn_regressor_model)
GaussianGRUModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_gru_model)
GaussianGRUPolicy (class in garage.tf.policies)
(class in garage.tf.policies.gaussian_gru_policy)
GaussianLSTMModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_lstm_model)
GaussianLSTMPolicy (class in garage.tf.policies)
(class in garage.tf.policies.gaussian_lstm_policy)
GaussianMLPBaseline (class in garage.tf.baselines)
(class in garage.tf.baselines.gaussian_mlp_baseline)
GaussianMLPBaseModule (class in garage.torch.modules.gaussian_mlp_module)
GaussianMLPIndependentStdModule (class in garage.torch.modules)
(class in garage.torch.modules.gaussian_mlp_module)
GaussianMLPModel (class in garage.tf.models)
(class in garage.tf.models.gaussian_mlp_model)
GaussianMLPModule (class in garage.torch.modules)
(class in garage.torch.modules.gaussian_mlp_module)
GaussianMLPPolicy (class in garage.tf.policies)
(class in garage.tf.policies.gaussian_mlp_policy)
(class in garage.torch.policies)
(class in garage.torch.policies.gaussian_mlp_policy)
GaussianMLPRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.gaussian_mlp_regressor)
GaussianMLPRegressorModel (class in garage.tf.regressors.gaussian_mlp_regressor_model)
GaussianMLPTwoHeadedModule (class in garage.torch.modules)
(class in garage.torch.modules.gaussian_mlp_module)
GaussianStrategy (class in garage.np.exploration_strategies.gaussian_strategy)
get() (LazyDict method)
get_action() (CategoricalCNNPolicy method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(DeterministicMLPPolicy method)
,
[1]
(DiscreteQfDerivedPolicy method)
,
[1]
(EpsilonGreedyStrategy method)
,
[1]
(ExplorationStrategy method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
,
[2]
,
[3]
(GaussianStrategy method)
(OUStrategy method)
,
[1]
(Policy method)
,
[1]
,
[2]
,
[3]
,
[4]
,
[5]
(ScriptedPolicy method)
,
[1]
(UniformControlPolicy method)
get_action_sym() (ContinuousMLPPolicy method)
,
[1]
get_actions() (CategoricalCNNPolicy method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(CategoricalMLPPolicy method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(DeterministicMLPPolicy method)
,
[1]
(DiscreteQfDerivedPolicy method)
,
[1]
(EpsilonGreedyStrategy method)
,
[1]
(ExplorationStrategy method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
,
[2]
,
[3]
(GaussianStrategy method)
(OUStrategy method)
,
[1]
(Policy method)
,
[1]
,
[2]
,
[3]
(ScriptedPolicy method)
,
[1]
(UniformControlPolicy method)
get_entropy() (GaussianMLPPolicy method)
,
[1]
get_env_copy() (LocalRunner method)
,
[1]
get_global_vars() (Policy method)
,
[1]
(QFunction method)
,
[1]
get_history_list() (ISSampler method)
get_param_shapes() (Policy method)
,
[1]
(Regressor method)
,
[1]
get_param_values() (Baseline method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(Policy method)
,
[1]
(ProductRegressor method)
,
[1]
(Regressor method)
,
[1]
(ScriptedPolicy method)
,
[1]
(ZeroBaseline method)
,
[1]
get_params() (GaussianMLPPolicy method)
,
[1]
(Policy method)
,
[1]
(Regressor method)
,
[1]
get_params_internal() (BernoulliMLPRegressor method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(ContinuousMLPRegressor method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(GaussianMLPRegressor method)
,
[1]
(Regressor method)
,
[1]
(UniformControlPolicy method)
get_plotters() (Plotter static method)
,
[1]
,
[2]
,
[3]
get_possible_next_states() (GridWorldEnv method)
,
[1]
get_qval() (ContinuousMLPQFunction method)
,
[1]
get_qval_sym() (ContinuousMLPQFunction method)
,
[1]
(DiscreteCNNQFunction method)
,
[1]
(DiscreteMLPQFunction method)
,
[1]
(QFunction method)
,
[1]
get_regularizable_vars() (CategoricalMLPPolicy method)
,
[1]
(ContinuousMLPPolicy method)
,
[1]
(QFunction method)
,
[1]
get_seed() (in module garage.experiment.deterministic)
get_target_ops() (in module garage.tf.misc.tensor_utils)
get_trainable_vars() (Policy method)
,
[1]
(QFunction method)
,
[1]
graph_inputs() (in module garage.tf.misc.tensor_utils)
Grayscale (class in garage.envs.wrappers)
(class in garage.envs.wrappers.grayscale)
GridWorldEnv (class in garage.envs)
(class in garage.envs.grid_world_env)
gru() (in module garage.tf.models.gru)
GRUModel (class in garage.tf.models)
(class in garage.tf.models.gru_model)
H
HerReplayBuffer (class in garage.replay_buffer)
(class in garage.replay_buffer.her_replay_buffer)
HessianVectorProduct (class in garage.tf.optimizers.conjugate_gradient_optimizer)
history (ISSampler attribute)
I
inc() (ProgBarCounter method)
init_plot() (Plotter method)
,
[1]
init_worker() (Plotter method)
,
[1]
initialize() (in module garage.sampler.parallel_sampler)
(StatefulPool method)
initialize_tf_vars() (LocalTFRunner method)
,
[1]
input (DiscreteCNNQFunction attribute)
,
[1]
(DiscreteMLPQFunction attribute)
,
[1]
(Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
inputs (ContinuousMLPQFunction attribute)
,
[1]
(Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
ISSampler (class in garage.sampler.is_sampler)
iterate() (BatchDataset method)
,
[1]
ivariants() (VariantGenerator method)
,
[1]
K
kl() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
kl_sym() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
L
launch() (DmControlViewer method)
LazyDict (class in garage.tf.optimizers.utils)
LbfgsOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.lbfgs_optimizer)
likelihood_ratio_sym() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(RecurrentCategorical method)
,
[1]
LinearFeatureBaseline (class in garage.np.baselines)
(class in garage.np.baselines.linear_feature_baseline)
load() (Snapshotter method)
,
[1]
LocalRunner (class in garage.experiment)
(class in garage.experiment.local_runner)
LocalTFRunner (class in garage.tf.experiment)
(class in garage.tf.experiment.local_tf_runner)
log_diagnostics() (Baseline method)
,
[1]
(GridWorldEnv method)
,
[1]
(LocalRunner method)
,
[1]
(NormalizedEnv method)
(Policy method)
,
[1]
,
[2]
,
[3]
(QFunction method)
,
[1]
log_likelihood() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
(RecurrentCategorical method)
,
[1]
log_likelihood_sym() (Bernoulli method)
,
[1]
(BernoulliMLPRegressor method)
,
[1]
(Categorical method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(DiagonalGaussian method)
,
[1]
(Distribution method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(GaussianMLPRegressor method)
,
[1]
(RecurrentCategorical method)
,
[1]
(StochasticRegressor method)
,
[1]
loss() (ConjugateGradientOptimizer method)
,
[1]
(FirstOrderOptimizer method)
,
[1]
(LbfgsOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
lstm() (in module garage.tf.models.lstm)
LSTMModel (class in garage.tf.models)
(class in garage.tf.models.lstm_model)
M
make_her_sample() (in module garage.replay_buffer.her_replay_buffer)
max_episode_steps (TfEnv attribute)
,
[1]
max_episode_steps() (NormalizedEnv method)
MaxAndSkip (class in garage.envs.wrappers)
(class in garage.envs.wrappers.max_and_skip)
mlp() (in module garage.tf.models.mlp)
MLPDuelingModel (class in garage.tf.models)
(class in garage.tf.models.mlp_dueling_model)
MLPMergeModel (class in garage.tf.models)
(class in garage.tf.models.mlp_merge_model)
MLPModel (class in garage.tf.models)
(class in garage.tf.models.mlp_model)
MLPModule (class in garage.torch.modules)
(class in garage.torch.modules.mlp_module)
Model (class in garage.tf.models)
(class in garage.tf.models.base)
MultiEnvWrapper (class in garage.envs.multi_env_wrapper)
MultiHeadedMLPModule (class in garage.torch.modules)
(class in garage.torch.modules.multi_headed_mlp_module)
N
n_transitions_stored (ReplayBuffer attribute)
name (BaseModel attribute)
(Model attribute)
,
[1]
(Policy attribute)
,
[1]
Network (class in garage.tf.models.base)
network_input_spec() (GaussianGRUModel method)
,
[1]
(GRUModel method)
,
[1]
(GaussianLSTMModel method)
,
[1]
(LSTMModel method)
,
[1]
(MLPMergeModel method)
,
[1]
(Model method)
,
[1]
network_output_spec() (GaussianCNNModel method)
,
[1]
(GRUModel method)
,
[1]
(GaussianCNNRegressorModel method)
,
[1]
(GaussianGRUModel method)
,
[1]
(GaussianLSTMModel method)
,
[1]
(GaussianMLPModel method)
,
[1]
(GaussianMLPRegressorModel method)
(LSTMModel method)
,
[1]
(Model method)
,
[1]
(NormalizedInputMLPModel method)
,
[1]
networks (Model attribute)
,
[1]
new_tensor() (in module garage.tf.misc.tensor_utils)
new_tensor_like() (in module garage.tf.misc.tensor_utils)
Noop (class in garage.envs.wrappers)
(class in garage.envs.wrappers.noop)
normalize (in module garage.envs)
(in module garage.envs.normalized_env)
normalize_pixel_batch() (in module garage.misc.tensor_utils)
NormalizedEnv (class in garage.envs.normalized_env)
NormalizedInputMLPModel (class in garage.tf.models)
(class in garage.tf.models.normalized_input_mlp_model)
np_to_torch() (in module garage.torch.utils)
num_envs (ParallelVecEnvExecutor attribute)
(VecEnvExecutor attribute)
num_tasks (MultiEnvWrapper attribute)
number_batches (BatchDataset attribute)
,
[1]
O
observation_space (Grayscale attribute)
,
[1]
(GridWorldEnv attribute)
,
[1]
(MultiEnvWrapper attribute)
(ParallelVecEnvExecutor attribute)
(PointEnv attribute)
,
[1]
,
[2]
,
[3]
(Policy attribute)
,
[1]
,
[2]
,
[3]
,
[4]
,
[5]
(Resize attribute)
,
[1]
(StackFrames attribute)
,
[1]
(VecEnvExecutor attribute)
obtain_samples() (BatchSampler method)
(ISSampler method)
(LocalRunner method)
,
[1]
(OffPolicyVectorizedSampler method)
(OnPolicyVectorizedSampler method)
(Sampler method)
OffPolicyVectorizedSampler (class in garage.sampler.off_policy_vectorized_sampler)
OnPolicyVectorizedSampler (class in garage.sampler.on_policy_vectorized_sampler)
optimize() (ConjugateGradientOptimizer method)
,
[1]
(FirstOrderOptimizer method)
,
[1]
(LbfgsOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
OUStrategy (class in garage.np.exploration_strategies)
(class in garage.np.exploration_strategies.ou_strategy)
output (Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
outputs (Model attribute)
,
[1]
(Network attribute)
(Sequential attribute)
,
[1]
P
pad_tensor() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
pad_tensor_dict() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
pad_tensor_n() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
ParallelVecEnvExecutor (class in garage.sampler.parallel_vec_env_executor)
parameter() (in module garage.tf.models.parameter)
parameters (BaseModel attribute)
(Model attribute)
,
[1]
PathBuffer (class in garage.replay_buffer)
(class in garage.replay_buffer.path_buffer)
PearlmutterHvp (class in garage.tf.optimizers.conjugate_gradient_optimizer)
PenaltyLbfgsOptimizer (class in garage.tf.optimizers)
(class in garage.tf.optimizers.penalty_lbfgs_optimizer)
plot_experiments() (ExperimentDatabase method)
(in module garage.experiment.nb_utils)
Plotter (class in garage.plotter)
(class in garage.plotter.plotter)
(class in garage.tf.plotter)
(class in garage.tf.plotter.plotter)
PointEnv (class in garage.envs)
(class in garage.envs.point_env)
Policy (class in garage.np.policies)
(class in garage.np.policies.base)
(class in garage.tf.policies)
(class in garage.tf.policies.base)
(class in garage.torch.policies)
(class in garage.torch.policies.base)
populate_task() (in module garage.sampler.parallel_sampler)
positive_advs() (in module garage.tf.misc.tensor_utils)
predict() (Baseline method)
,
[1]
(BernoulliMLPRegressor method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(ContinuousMLPRegressor method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianCNNRegressor method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(GaussianMLPRegressor method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(ProductRegressor method)
,
[1]
(Regressor method)
,
[1]
(ZeroBaseline method)
,
[1]
predict_log_likelihood() (BernoulliMLPRegressor method)
,
[1]
(CategoricalMLPRegressor method)
,
[1]
(ProductRegressor method)
,
[1]
predict_n() (ZeroBaseline method)
,
[1]
predict_sym() (ContinuousMLPRegressor method)
,
[1]
ProductRegressor (class in garage.np.regressors)
(class in garage.np.regressors.product_regressor)
ProgBarCounter (class in garage.misc.prog_bar_counter)
Q
q_vals (DiscreteCNNQFunction attribute)
,
[1]
(DiscreteMLPQFunction attribute)
,
[1]
QFunction (class in garage.np.q_functions)
(class in garage.np.q_functions.base)
(class in garage.tf.q_functions)
(class in garage.tf.q_functions.base)
R
recurrent (CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(Policy attribute)
,
[1]
,
[2]
,
[3]
recurrent_parameter() (in module garage.tf.models.parameter)
RecurrentCategorical (class in garage.tf.distributions)
(class in garage.tf.distributions.recurrent_categorical)
RecurrentDiagonalGaussian (in module garage.tf.distributions)
Regressor (class in garage.tf.regressors)
(class in garage.tf.regressors.base)
render() (DmControlViewer method)
(GridWorldEnv method)
,
[1]
(NormalizedEnv method)
(PointEnv method)
,
[1]
ReplayBuffer (class in garage.replay_buffer.base)
reset() (AtariEnv method)
,
[1]
(CategoricalGRUPolicy method)
,
[1]
(CategoricalLSTMPolicy method)
,
[1]
(ClipReward method)
,
[1]
(DeterministicMLPPolicy method)
,
[1]
(EpisodicLife method)
,
[1]
(ExplorationStrategy method)
,
[1]
(FireReset method)
,
[1]
(GarageEnv method)
,
[1]
(GaussianGRUPolicy method)
,
[1]
(GaussianLSTMPolicy method)
,
[1]
(GaussianMLPPolicy method)
,
[1]
(Grayscale method)
,
[1]
(GridWorldEnv method)
,
[1]
(MaxAndSkip method)
,
[1]
(MultiEnvWrapper method)
(Noop method)
,
[1]
(NormalizedEnv method)
(OUStrategy method)
,
[1]
(ParallelVecEnvExecutor method)
(PointEnv method)
,
[1]
(Policy method)
,
[1]
,
[2]
,
[3]
(Resize method)
,
[1]
(ScriptedPolicy method)
,
[1]
(StackFrames method)
,
[1]
(VecEnvExecutor method)
Resize (class in garage.envs.wrappers)
(class in garage.envs.wrappers.resize)
restore() (LocalRunner method)
,
[1]
resume() (LocalRunner method)
,
[1]
RLAlgorithm (class in garage.np.algos.base)
rollout() (in module garage.sampler.utils)
round_robin_strategy() (in module garage.envs.multi_env_wrapper)
run_collect() (StatefulPool method)
run_each() (StatefulPool method)
run_experiment() (in module garage.experiment)
(in module garage.experiment.experiment)
run_imap_unordered() (StatefulPool method)
run_map() (StatefulPool method)
S
sample() (Bernoulli method)
,
[1]
(Categorical method)
,
[1]
(DiagonalGaussian method)
,
[1]
(HerReplayBuffer method)
,
[1]
(ReplayBuffer method)
(SimpleReplayBuffer method)
,
[1]
sample_path() (PathBuffer method)
,
[1]
sample_paths() (in module garage.sampler.parallel_sampler)
sample_predict() (BernoulliMLPRegressor method)
,
[1]
(ProductRegressor method)
,
[1]
sample_sym() (Categorical method)
,
[1]
sample_transitions() (PathBuffer method)
,
[1]
Sampler (class in garage.sampler.base)
save() (LocalRunner method)
,
[1]
save_itr_params() (Snapshotter method)
,
[1]
ScriptedPolicy (class in garage.np.policies)
(class in garage.np.policies.scripted_policy)
Sequential (class in garage.tf.models)
(class in garage.tf.models.sequential)
set() (LazyDict method)
set_param_values() (Baseline method)
,
[1]
(ContinuousMLPBaseline method)
,
[1]
(GaussianCNNBaseline method)
,
[1]
(GaussianMLPBaseline method)
,
[1]
(LinearFeatureBaseline method)
,
[1]
(Policy method)
,
[1]
(ProductRegressor method)
,
[1]
(Regressor method)
,
[1]
(ScriptedPolicy method)
,
[1]
(ZeroBaseline method)
,
[1]
set_seed() (in module garage.experiment.deterministic)
(in module garage.sampler.parallel_sampler)
setup() (LocalRunner method)
,
[1]
(LocalTFRunner method)
,
[1]
SharedGlobal (class in garage.sampler.stateful_pool)
shutdown_worker() (BatchSampler method)
(OffPolicyVectorizedSampler method)
(OnPolicyVectorizedSampler method)
(Sampler method)
SimpleReplayBuffer (class in garage.replay_buffer)
(class in garage.replay_buffer.simple_replay_buffer)
simulate() (OUStrategy method)
,
[1]
sliced_fun() (in module garage.tf.optimizers.utils)
snapshot_dir (SnapshotConfig attribute)
,
[1]
(Snapshotter attribute)
,
[1]
snapshot_gap (SnapshotConfig attribute)
,
[1]
(Snapshotter attribute)
,
[1]
snapshot_mode (SnapshotConfig attribute)
,
[1]
(Snapshotter attribute)
,
[1]
SnapshotConfig (class in garage.experiment)
(class in garage.experiment.snapshotter)
Snapshotter (class in garage.experiment)
(class in garage.experiment.snapshotter)
split_tensor_dict_list() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
stack_tensor_dict_list() (in module garage.misc.tensor_utils)
(in module garage.tf.misc.tensor_utils)
stack_tensor_list() (in module garage.tf.misc.tensor_utils)
StackFrames (class in garage.envs.wrappers)
(class in garage.envs.wrappers.stack_frames)
start() (Plotter method)
,
[1]
start_worker() (BatchSampler method)
(OffPolicyVectorizedSampler method)
(OnPolicyVectorizedSampler method)
(Sampler method)
state_info_keys (Policy attribute)
,
[1]
,
[2]
,
[3]
state_info_specs (CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(Policy attribute)
,
[1]
StatefulPool (class in garage.sampler.stateful_pool)
step() (AtariEnv method)
,
[1]
(ClipReward method)
,
[1]
(EpisodicLife method)
,
[1]
(FireReset method)
,
[1]
(GarageEnv method)
,
[1]
(Grayscale method)
,
[1]
(GridWorldEnv method)
,
[1]
Step() (in module garage.envs)
(in module garage.envs.base)
step() (MaxAndSkip method)
,
[1]
(MultiEnvWrapper method)
(Noop method)
,
[1]
(NormalizedEnv method)
(ParallelVecEnvExecutor method)
(PointEnv method)
,
[1]
(Resize method)
,
[1]
(StackFrames method)
,
[1]
(VecEnvExecutor method)
step_epochs() (LocalRunner method)
,
[1]
StochasticPolicy (class in garage.np.policies)
(class in garage.np.policies.base)
(class in garage.tf.policies)
(class in garage.tf.policies.base)
StochasticRegressor (class in garage.tf.regressors)
(class in garage.tf.regressors.base)
stop() (ProgBarCounter method)
store_episode() (ReplayBuffer method)
T
task_space (MultiEnvWrapper attribute)
terminate() (Policy method)
,
[1]
,
[2]
,
[3]
terminate_task() (in module garage.sampler.parallel_sampler)
TfEnv (class in garage.tf.envs)
(class in garage.tf.envs.base)
to_local_command() (in module garage.experiment)
(in module garage.experiment.experiment)
to_name_suffix() (VariantGenerator method)
,
[1]
torch_to_np() (in module garage.torch.utils)
train() (LocalRunner method)
,
[1]
(RLAlgorithm method)
truncate_paths() (in module garage.sampler.utils)
truncate_tensor_dict() (in module garage.misc.tensor_utils)
U
unflatten_tensor_variables() (in module garage.tf.misc.tensor_utils)
unflatten_tensors() (in module garage.misc.tensor_utils)
uniform_random_strategy() (in module garage.envs.multi_env_wrapper)
UniformControlPolicy (class in garage.tf.policies.uniform_control_policy)
uniq() (in module garage.experiment.nb_utils)
unique() (ExperimentDatabase method)
update() (BatchDataset method)
,
[1]
update_hvp() (FiniteDifferenceHvp method)
,
[1]
(HessianVectorProduct method)
(PearlmutterHvp method)
update_opt() (ConjugateGradientOptimizer method)
,
[1]
(FirstOrderOptimizer method)
,
[1]
(LbfgsOptimizer method)
,
[1]
(PenaltyLbfgsOptimizer method)
,
[1]
update_plot() (Plotter method)
,
[1]
,
[2]
,
[3]
V
variant() (in module garage.experiment)
(in module garage.experiment.experiment)
variant_dict() (VariantGenerator method)
,
[1]
VariantDict (class in garage.experiment.experiment)
VariantGenerator (class in garage.experiment)
(class in garage.experiment.experiment)
variants() (VariantGenerator method)
,
[1]
VecEnvExecutor (class in garage.sampler.vec_env_executor)
vectorized (CategoricalCNNPolicy attribute)
,
[1]
(CategoricalGRUPolicy attribute)
,
[1]
(CategoricalLSTMPolicy attribute)
,
[1]
(CategoricalMLPPolicy attribute)
,
[1]
(ContinuousMLPPolicy attribute)
,
[1]
(DiscreteQfDerivedPolicy attribute)
,
[1]
(GaussianGRUPolicy attribute)
,
[1]
(GaussianLSTMPolicy attribute)
,
[1]
(GaussianMLPPolicy attribute)
,
[1]
,
[2]
,
[3]
(Policy attribute)
,
[1]
,
[2]
,
[3]
(UniformControlPolicy attribute)
W
worker_init_envs() (in module garage.sampler.parallel_vec_env_executor)
worker_run_reset() (in module garage.sampler.parallel_vec_env_executor)
worker_run_step() (in module garage.sampler.parallel_vec_env_executor)
Z
ZeroBaseline (class in garage.np.baselines)
(class in garage.np.baselines.zero_baseline)
Read the Docs
v: v2019.10.2
Versions
latest
stable
v2020.06.0
v2019.10.2
v2019.10.1
v2019.10.0
v2019.02.2
v2019.02.1
v2019.02.0
v2018.10.1
v2018.10.0
Downloads
On Read the Docs
Project Home
Builds
Free document hosting provided by
Read the Docs
.