CHANGELOG.md
CONTRIBUTING.md
LICENSE
MANIFEST.in
Makefile
README.md
VERSION
setup.cfg
setup.py
docker/Dockerfile.base.16.04
docker/Dockerfile.base.18.04
docker/Dockerfile.headless
docker/Dockerfile.nvidia
docker/Dockerfile.runtime
docker/README.md
docker/docker-compose-ci.yml
docker/docker-compose-headless.yml
docker/docker-compose-nvidia.yml
docker/entrypoint-headless.sh
docker/entrypoint-runtime.sh
docs/Makefile
docs/conf.py
docs/index.rst
docs/requirements.txt
docs/user/experiments.rst
docs/user/implement_algo_advanced.rst
docs/user/implement_algo_basic.rst
docs/user/implement_env.rst
docs/user/installation.rst
examples/resume_training.py
examples/sim_policy.py
examples/step_dm_control_env.py
examples/step_env.py
examples/jupyter/custom_env.ipynb
examples/jupyter/trpo_gym_tf_cartpole.ipynb
examples/np/cem_cartpole.py
examples/np/cma_es_cartpole.py
examples/tf/ddpg_pendulum.py
examples/tf/dqn_cartpole.py
examples/tf/dqn_pong.py
examples/tf/erwr_cartpole.py
examples/tf/her_ddpg_fetchreach.py
examples/tf/multi_env_ppo.py
examples/tf/ppo_memorize_digits.py
examples/tf/ppo_pendulum.py
examples/tf/reps_gym_cartpole.py
examples/tf/td3_pendulum.py
examples/tf/trpo_cartpole.py
examples/tf/trpo_cartpole_batch_sampler.py
examples/tf/trpo_cartpole_recurrent.py
examples/tf/trpo_cubecrash.py
examples/tf/trpo_gym_tf_cartpole.py
examples/tf/trpo_swimmer.py
examples/tf/trpo_swimmer_ray_sampler.py
examples/tf/trpois_inverted_pendulum.py
examples/tf/vpg_cartpole.py
examples/tf/vpgis_inverted_pendulum.py
examples/torch/ddpg_pendulum.py
examples/torch/vpg_pendulum.py
scripts/check_commit_message
scripts/garage
scripts/setup_colab.sh
scripts/setup_linux.sh
scripts/setup_macos.sh
scripts/travisci/check_precommit.sh
src/garage/__init__.py
src/garage.egg-info/PKG-INFO
src/garage.egg-info/SOURCES.txt
src/garage.egg-info/dependency_links.txt
src/garage.egg-info/requires.txt
src/garage.egg-info/top_level.txt
src/garage/envs/__init__.py
src/garage/envs/base.py
src/garage/envs/env_spec.py
src/garage/envs/grid_world_env.py
src/garage/envs/multi_env_wrapper.py
src/garage/envs/normalized_env.py
src/garage/envs/point_env.py
src/garage/envs/dm_control/__init__.py
src/garage/envs/dm_control/dm_control_env.py
src/garage/envs/dm_control/dm_control_viewer.py
src/garage/envs/wrappers/__init__.py
src/garage/envs/wrappers/atari_env.py
src/garage/envs/wrappers/clip_reward.py
src/garage/envs/wrappers/episodic_life.py
src/garage/envs/wrappers/fire_reset.py
src/garage/envs/wrappers/grayscale.py
src/garage/envs/wrappers/max_and_skip.py
src/garage/envs/wrappers/noop.py
src/garage/envs/wrappers/resize.py
src/garage/envs/wrappers/stack_frames.py
src/garage/experiment/__init__.py
src/garage/experiment/deterministic.py
src/garage/experiment/experiment.py
src/garage/experiment/experiment_wrapper.py
src/garage/experiment/local_runner.py
src/garage/experiment/nb_utils.py
src/garage/experiment/snapshotter.py
src/garage/misc/__init__.py
src/garage/misc/prog_bar_counter.py
src/garage/misc/tensor_utils.py
src/garage/np/__init__.py
src/garage/np/algos/__init__.py
src/garage/np/algos/base.py
src/garage/np/algos/batch_polopt.py
src/garage/np/algos/cem.py
src/garage/np/algos/cma_es.py
src/garage/np/algos/nop.py
src/garage/np/algos/off_policy_rl_algorithm.py
src/garage/np/baselines/__init__.py
src/garage/np/baselines/base.py
src/garage/np/baselines/linear_feature_baseline.py
src/garage/np/baselines/zero_baseline.py
src/garage/np/exploration_strategies/__init__.py
src/garage/np/exploration_strategies/base.py
src/garage/np/exploration_strategies/epsilon_greedy_strategy.py
src/garage/np/exploration_strategies/gaussian_strategy.py
src/garage/np/exploration_strategies/ou_strategy.py
src/garage/np/optimizers/__init__.py
src/garage/np/optimizers/minibatch_dataset.py
src/garage/np/policies/__init__.py
src/garage/np/policies/base.py
src/garage/np/policies/scripted_policy.py
src/garage/np/q_functions/__init__.py
src/garage/np/q_functions/base.py
src/garage/np/regressors/__init__.py
src/garage/np/regressors/product_regressor.py
src/garage/plotter/__init__.py
src/garage/plotter/plotter.py
src/garage/replay_buffer/__init__.py
src/garage/replay_buffer/base.py
src/garage/replay_buffer/her_replay_buffer.py
src/garage/replay_buffer/path_buffer.py
src/garage/replay_buffer/simple_replay_buffer.py
src/garage/sampler/__init__.py
src/garage/sampler/base.py
src/garage/sampler/batch_sampler.py
src/garage/sampler/is_sampler.py
src/garage/sampler/off_policy_vectorized_sampler.py
src/garage/sampler/on_policy_vectorized_sampler.py
src/garage/sampler/parallel_sampler.py
src/garage/sampler/parallel_vec_env_executor.py
src/garage/sampler/ray_sampler.py
src/garage/sampler/stateful_pool.py
src/garage/sampler/utils.py
src/garage/sampler/vec_env_executor.py
src/garage/tf/__init__.py
src/garage/tf/algos/__init__.py
src/garage/tf/algos/batch_polopt.py
src/garage/tf/algos/ddpg.py
src/garage/tf/algos/dqn.py
src/garage/tf/algos/erwr.py
src/garage/tf/algos/npo.py
src/garage/tf/algos/ppo.py
src/garage/tf/algos/reps.py
src/garage/tf/algos/td3.py
src/garage/tf/algos/tnpg.py
src/garage/tf/algos/trpo.py
src/garage/tf/algos/vpg.py
src/garage/tf/baselines/__init__.py
src/garage/tf/baselines/continuous_mlp_baseline.py
src/garage/tf/baselines/gaussian_cnn_baseline.py
src/garage/tf/baselines/gaussian_mlp_baseline.py
src/garage/tf/distributions/__init__.py
src/garage/tf/distributions/base.py
src/garage/tf/distributions/bernoulli.py
src/garage/tf/distributions/categorical.py
src/garage/tf/distributions/diagonal_gaussian.py
src/garage/tf/distributions/recurrent_categorical.py
src/garage/tf/distributions/recurrent_diagonal_gaussian.py
src/garage/tf/envs/__init__.py
src/garage/tf/envs/base.py
src/garage/tf/experiment/__init__.py
src/garage/tf/experiment/local_tf_runner.py
src/garage/tf/misc/__init__.py
src/garage/tf/misc/tensor_utils.py
src/garage/tf/models/__init__.py
src/garage/tf/models/base.py
src/garage/tf/models/cnn.py
src/garage/tf/models/cnn_model.py
src/garage/tf/models/cnn_model_max_pooling.py
src/garage/tf/models/gaussian_cnn_model.py
src/garage/tf/models/gaussian_gru_model.py
src/garage/tf/models/gaussian_lstm_model.py
src/garage/tf/models/gaussian_mlp_model.py
src/garage/tf/models/gru.py
src/garage/tf/models/gru_model.py
src/garage/tf/models/lstm.py
src/garage/tf/models/lstm_model.py
src/garage/tf/models/mlp.py
src/garage/tf/models/mlp_dueling_model.py
src/garage/tf/models/mlp_merge_model.py
src/garage/tf/models/mlp_model.py
src/garage/tf/models/normalized_input_mlp_model.py
src/garage/tf/models/parameter.py
src/garage/tf/models/sequential.py
src/garage/tf/optimizers/__init__.py
src/garage/tf/optimizers/conjugate_gradient_optimizer.py
src/garage/tf/optimizers/first_order_optimizer.py
src/garage/tf/optimizers/lbfgs_optimizer.py
src/garage/tf/optimizers/penalty_lbfgs_optimizer.py
src/garage/tf/optimizers/utils.py
src/garage/tf/plotter/__init__.py
src/garage/tf/plotter/plotter.py
src/garage/tf/policies/__init__.py
src/garage/tf/policies/base.py
src/garage/tf/policies/categorical_cnn_policy.py
src/garage/tf/policies/categorical_gru_policy.py
src/garage/tf/policies/categorical_lstm_policy.py
src/garage/tf/policies/categorical_mlp_policy.py
src/garage/tf/policies/continuous_mlp_policy.py
src/garage/tf/policies/discrete_qf_derived_policy.py
src/garage/tf/policies/gaussian_gru_policy.py
src/garage/tf/policies/gaussian_lstm_policy.py
src/garage/tf/policies/gaussian_mlp_policy.py
src/garage/tf/policies/uniform_control_policy.py
src/garage/tf/q_functions/__init__.py
src/garage/tf/q_functions/base.py
src/garage/tf/q_functions/continuous_mlp_q_function.py
src/garage/tf/q_functions/discrete_cnn_q_function.py
src/garage/tf/q_functions/discrete_mlp_q_function.py
src/garage/tf/regressors/__init__.py
src/garage/tf/regressors/base.py
src/garage/tf/regressors/bernoulli_mlp_regressor.py
src/garage/tf/regressors/categorical_mlp_regressor.py
src/garage/tf/regressors/continuous_mlp_regressor.py
src/garage/tf/regressors/gaussian_cnn_regressor.py
src/garage/tf/regressors/gaussian_cnn_regressor_model.py
src/garage/tf/regressors/gaussian_mlp_regressor.py
src/garage/tf/regressors/gaussian_mlp_regressor_model.py
src/garage/tf/samplers/__init__.py
src/garage/tf/samplers/batch_sampler.py
src/garage/tf/samplers/ray_sampler.py
src/garage/torch/__init__.py
src/garage/torch/utils.py
src/garage/torch/algos/__init__.py
src/garage/torch/algos/ddpg.py
src/garage/torch/algos/loss_function_utils.py
src/garage/torch/algos/vpg.py
src/garage/torch/modules/__init__.py
src/garage/torch/modules/gaussian_mlp_module.py
src/garage/torch/modules/mlp_module.py
src/garage/torch/modules/multi_headed_mlp_module.py
src/garage/torch/policies/__init__.py
src/garage/torch/policies/base.py
src/garage/torch/policies/deterministic_mlp_policy.py
src/garage/torch/policies/gaussian_mlp_policy.py
src/garage/torch/q_functions/__init__.py
src/garage/torch/q_functions/continuous_mlp_q_function.py
tests/__init__.py
tests/helpers.py
tests/mock.py
tests/quirks.py
tests/wrappers.py
tests/benchmarks/README.md
tests/benchmarks/__init__.py
tests/benchmarks/garage/__init__.py
tests/benchmarks/garage/tf/__init__.py
tests/benchmarks/garage/tf/algos/__init__.py
tests/benchmarks/garage/tf/algos/test_benchmark_ddpg.py
tests/benchmarks/garage/tf/algos/test_benchmark_her.py
tests/benchmarks/garage/tf/algos/test_benchmark_ppo.py
tests/benchmarks/garage/tf/algos/test_benchmark_td3.py
tests/benchmarks/garage/tf/algos/test_benchmark_trpo.py
tests/benchmarks/garage/tf/algos/test_benchmark_vpg.py
tests/benchmarks/garage/tf/baselines/__init__.py
tests/benchmarks/garage/tf/baselines/test_benchmark_gaussian_cnn_baseline.py
tests/benchmarks/garage/tf/baselines/test_benchmark_gaussian_mlp_baseline.py
tests/benchmarks/garage/tf/policies/__init__.py
tests/benchmarks/garage/tf/policies/test_benchmark_categorical_cnn_policy.py
tests/benchmarks/garage/tf/policies/test_benchmark_categorical_gru_policy.py
tests/benchmarks/garage/tf/policies/test_benchmark_categorical_lstm_policy.py
tests/benchmarks/garage/tf/policies/test_benchmark_categorical_mlp_policy.py
tests/benchmarks/garage/tf/policies/test_benchmark_continuous_mlp_policy.py
tests/benchmarks/garage/tf/policies/test_benchmark_gaussian_gru_policy.py
tests/benchmarks/garage/tf/policies/test_benchmark_gaussian_lstm_policy.py
tests/benchmarks/garage/tf/policies/test_benchmark_gaussian_mlp_policy.py
tests/benchmarks/garage/tf/q_functions/__init__.py
tests/benchmarks/garage/tf/q_functions/test_benchmark_continuous_mlp_q_function.py
tests/fixtures/__init__.py
tests/fixtures/fixtures.py
tests/fixtures/logger.py
tests/fixtures/algos/__init__.py
tests/fixtures/algos/dummy_algo.py
tests/fixtures/algos/dummy_tf_algo.py
tests/fixtures/algos/instrumented_batch_polopt.py
tests/fixtures/algos/instrumented_nop.py
tests/fixtures/algos/nop_pendulum_instrumented.py
tests/fixtures/distributions/__init__.py
tests/fixtures/distributions/dummy_distribution.py
tests/fixtures/envs/__init__.py
tests/fixtures/envs/dummy/__init__.py
tests/fixtures/envs/dummy/base.py
tests/fixtures/envs/dummy/dummy_box_env.py
tests/fixtures/envs/dummy/dummy_dict_env.py
tests/fixtures/envs/dummy/dummy_discrete_2d_env.py
tests/fixtures/envs/dummy/dummy_discrete_env.py
tests/fixtures/envs/dummy/dummy_discrete_pixel_env.py
tests/fixtures/envs/dummy/dummy_discrete_pixel_env_baselines.py
tests/fixtures/envs/dummy/dummy_reward_box_env.py
tests/fixtures/envs/wrappers/__init__.py
tests/fixtures/envs/wrappers/reshape_observation.py
tests/fixtures/experiment/__init__.py
tests/fixtures/experiment/fixture_experiment.py
tests/fixtures/models/__init__.py
tests/fixtures/models/simple_cnn_model.py
tests/fixtures/models/simple_cnn_model_with_max_pooling.py
tests/fixtures/models/simple_gaussian_cnn_model.py
tests/fixtures/models/simple_gaussian_gru_model.py
tests/fixtures/models/simple_gaussian_lstm_model.py
tests/fixtures/models/simple_gaussian_mlp_model.py
tests/fixtures/models/simple_gru_model.py
tests/fixtures/models/simple_lstm_model.py
tests/fixtures/models/simple_mlp_merge_model.py
tests/fixtures/models/simple_mlp_model.py
tests/fixtures/policies/__init__.py
tests/fixtures/policies/dummy_policy.py
tests/fixtures/policies/dummy_recurrent_policy.py
tests/fixtures/q_functions/__init__.py
tests/fixtures/q_functions/simple_q_function.py
tests/fixtures/regressors/__init__.py
tests/fixtures/regressors/simple_gaussian_cnn_regressor.py
tests/fixtures/regressors/simple_gaussian_mlp_regressor.py
tests/fixtures/regressors/simple_mlp_regressor.py
tests/fixtures/tf/__init__.py
tests/fixtures/tf/instrumented_batch_polopt.py
tests/fixtures/tf/instrumented_npo.py
tests/fixtures/tf/instrumented_trpo.py
tests/fixtures/tf/trpo_pendulum_instrumented.py
tests/fixtures/tf/algos/dummy_off_policy_algo.py
tests/garage/.pylintrc
tests/garage/__init__.py
tests/garage/envs/__init__.py
tests/garage/envs/test_env_spec.py
tests/garage/envs/test_grid_world_env.py
tests/garage/envs/test_multi_env_wrapper.py
tests/garage/envs/test_normalized_env.py
tests/garage/envs/test_normalized_gym.py
tests/garage/envs/test_point_env.py
tests/garage/envs/box2d/parser/__init__.py
tests/garage/envs/dm_control/__init__.py
tests/garage/envs/dm_control/test_dm_control_env.py
tests/garage/envs/dm_control/test_dm_control_tf_policy.py
tests/garage/envs/wrappers/__init__.py
tests/garage/envs/wrappers/test_atari_env.py
tests/garage/envs/wrappers/test_clip_reward.py
tests/garage/envs/wrappers/test_episodic_life.py
tests/garage/envs/wrappers/test_fire_reset.py
tests/garage/envs/wrappers/test_grayscale_env.py
tests/garage/envs/wrappers/test_max_and_skip.py
tests/garage/envs/wrappers/test_noop.py
tests/garage/envs/wrappers/test_resize_env.py
tests/garage/envs/wrappers/test_stack_frames_env.py
tests/garage/experiment/__init__.py
tests/garage/experiment/test_deterministic.py
tests/garage/experiment/test_experiment.py
tests/garage/experiment/test_experiment_wrapper.py
tests/garage/experiment/test_resume.py
tests/garage/experiment/test_snapshotter.py
tests/garage/experiment/test_snapshotter_integration.py
tests/garage/misc/__init__.py
tests/garage/misc/test_tensor_utils.py
tests/garage/np/__init__.py
tests/garage/np/algos/__init__.py
tests/garage/np/algos/test_batch_polopt.py
tests/garage/np/algos/test_cem.py
tests/garage/np/algos/test_cma_es.py
tests/garage/np/exploration_strategies/__init__.py
tests/garage/np/exploration_strategies/test_epsilon_greedy_strategy.py
tests/garage/np/policies/test_scripted_policy.py
tests/garage/replay_buffer/__init__.py
tests/garage/replay_buffer/test_her_replay_buffer.py
tests/garage/replay_buffer/test_path_buffer.py
tests/garage/replay_buffer/test_replay_buffer.py
tests/garage/sampler/__init__.py
tests/garage/sampler/test_is_sampler.py
tests/garage/sampler/test_off_policy_vectorized_sampler_integration.py
tests/garage/sampler/test_on_policy_vectorized_sampler.py
tests/garage/sampler/test_ray_batched_sampler.py
tests/garage/sampler/test_sampler.py
tests/garage/sampler/test_stateful_pool.py
tests/garage/sampler/test_utils.py
tests/garage/tf/__init__.py
tests/garage/tf/algos/__init__.py
tests/garage/tf/algos/test_batch_polopt.py
tests/garage/tf/algos/test_ddpg.py
tests/garage/tf/algos/test_dqn.py
tests/garage/tf/algos/test_erwr.py
tests/garage/tf/algos/test_npo.py
tests/garage/tf/algos/test_ppo.py
tests/garage/tf/algos/test_reps.py
tests/garage/tf/algos/test_td3.py
tests/garage/tf/algos/test_tnpg.py
tests/garage/tf/algos/test_trpo.py
tests/garage/tf/algos/test_vpg.py
tests/garage/tf/baselines/__init__.py
tests/garage/tf/baselines/test_baselines.py
tests/garage/tf/baselines/test_continuous_mlp_baseline.py
tests/garage/tf/baselines/test_gaussian_cnn_baseline.py
tests/garage/tf/baselines/test_gaussian_mlp_baseline.py
tests/garage/tf/envs/__init__.py
tests/garage/tf/envs/test_base.py
tests/garage/tf/experiment/__init__.py
tests/garage/tf/experiment/test_local_tf_runner.py
tests/garage/tf/misc/__init__.py
tests/garage/tf/misc/test_tensor_utils.py
tests/garage/tf/models/__init__.py
tests/garage/tf/models/test_cnn.py
tests/garage/tf/models/test_cnn_model.py
tests/garage/tf/models/test_gaussian_cnn_model.py
tests/garage/tf/models/test_gaussian_gru_model.py
tests/garage/tf/models/test_gaussian_lstm_model.py
tests/garage/tf/models/test_gaussian_mlp_model.py
tests/garage/tf/models/test_gru.py
tests/garage/tf/models/test_gru_model.py
tests/garage/tf/models/test_lstm.py
tests/garage/tf/models/test_lstm_model.py
tests/garage/tf/models/test_mlp.py
tests/garage/tf/models/test_mlp_concat.py
tests/garage/tf/models/test_mlp_model.py
tests/garage/tf/models/test_model.py
tests/garage/tf/models/test_parameter.py
tests/garage/tf/optimizers/test_conjugate_gradient_optimizer.py
tests/garage/tf/policies/__init__.py
tests/garage/tf/policies/test_categorical_cnn_policy.py
tests/garage/tf/policies/test_categorical_gru_policy.py
tests/garage/tf/policies/test_categorical_lstm_policy.py
tests/garage/tf/policies/test_categorical_mlp_policy.py
tests/garage/tf/policies/test_categorical_policies.py
tests/garage/tf/policies/test_continuous_mlp_policy.py
tests/garage/tf/policies/test_gaussian_gru_policy.py
tests/garage/tf/policies/test_gaussian_lstm_policy.py
tests/garage/tf/policies/test_gaussian_mlp_policy.py
tests/garage/tf/policies/test_gaussian_policies.py
tests/garage/tf/policies/test_policies.py
tests/garage/tf/policies/test_qf_derived_policy.py
tests/garage/tf/q_functions/__init__.py
tests/garage/tf/q_functions/test_continuous_mlp_q_function.py
tests/garage/tf/q_functions/test_discrete_cnn_q_function.py
tests/garage/tf/q_functions/test_discrete_mlp_q_function.py
tests/garage/tf/regressors/__init__.py
tests/garage/tf/regressors/test_bernoulli_mlp_regressor.py
tests/garage/tf/regressors/test_categorical_mlp_regressor.py
tests/garage/tf/regressors/test_continuous_mlp_regressor.py
tests/garage/tf/regressors/test_gaussian_cnn_regressor.py
tests/garage/tf/regressors/test_gaussian_mlp_regressor.py
tests/garage/tf/samplers/__init__.py
tests/garage/tf/samplers/test_ray_batched_sampler_tf.py
tests/garage/torch/__init__.py
tests/garage/torch/algos/__init__.py
tests/garage/torch/algos/test_ddpg.py
tests/garage/torch/algos/test_loss_function_utils.py
tests/garage/torch/algos/test_vpg.py
tests/garage/torch/modules/test_gaussian_mlp_module.py
tests/garage/torch/modules/test_mlp_module.py
tests/garage/torch/modules/test_multi_headed_mlp_module.py
tests/garage/torch/policies/test_deterministic_mlp_policy.py
tests/garage/torch/policies/test_gaussian_mlp_policy.py
tests/garage/torch/q_functions/test_continuous_mlp_q_function.py
tests/integration_tests/__init__.py
tests/integration_tests/test_examples.py
tests/integration_tests/test_sigint.py