.gitignore
CODE_OF_CONDUCT.md
CONTRIBUTING.md
LICENSE
MANIFEST.in
README.md
ROADMAP.md
mkdocs.yml
pyproject.toml
requirements.txt
setup.cfg
setup.py
.github/workflows/docs.yml
.github/workflows/python-publish.yml
bbrl/__init__.py
bbrl/_version.py
bbrl/workspace.py
bbrl.egg-info/PKG-INFO
bbrl.egg-info/SOURCES.txt
bbrl.egg-info/dependency_links.txt
bbrl.egg-info/top_level.txt
bbrl/agents/README.md
bbrl/agents/__init__.py
bbrl/agents/agent.py
bbrl/agents/asynchronous.py
bbrl/agents/dataloader.py
bbrl/agents/gyma.py
bbrl/agents/gymb.py
bbrl/agents/remote.py
bbrl/agents/utils.py
bbrl/utils/__init__.py
bbrl/utils/chrono.py
bbrl/utils/distributions.py
bbrl/utils/functional.py
bbrl/utils/functionalb.py
bbrl/utils/logger.py
bbrl/utils/replay_buffer.py
bbrl/utils/utils.py
bbrl/visu/__init__.py
bbrl/visu/common.py
bbrl/visu/play.py
bbrl/visu/svpg_histograms.py
bbrl/visu/visu_critics.py
bbrl/visu/visu_policies.py
docs/bbrl/index.html
docs/bbrl/workspace.html
docs/bbrl/agents/agent.html
docs/bbrl/agents/asynchronous.html
docs/bbrl/agents/dataloader.html
docs/bbrl/agents/gyma.html
docs/bbrl/agents/gymb.html
docs/bbrl/agents/index.html
docs/bbrl/agents/remote.html
docs/bbrl/agents/utils.html
docs/bbrl/utils/chrono.html
docs/bbrl/utils/functional.html
docs/bbrl/utils/functionalb.html
docs/bbrl/utils/index.html
docs/bbrl/utils/logger.html
docs/bbrl/utils/replay_buffer.html
docs/bbrl/utils/utils.html
docs/bbrl/visu/common.html
docs/bbrl/visu/index.html
docs/bbrl/visu/svpg_histograms.html
docs/bbrl/visu/visu_critics.html
docs/bbrl/visu/visu_policies.html
pdfs/2022/2022_SOTA.pdf
pdfs/2022/2022_pg.pdf
pdfs/2022/dp_2022.pdf
pdfs/2022/rld_intro.pdf
pdfs/2022/tab_rl_2022.pdf
pdfs/advanced/gcrl.pdf
pdfs/bbrl/bbrl_foundations.pdf
pdfs/deterministic/11_ddpg.pdf
pdfs/deterministic/Agent57.pdf
pdfs/deterministic/alpha0.pdf
pdfs/deterministic/alphaNPI.pdf
pdfs/deterministic/beyond_rainbow.pdf
pdfs/deterministic/ddpg.pdf
pdfs/deterministic/dp.pdf
pdfs/deterministic/dqn.pdf
pdfs/deterministic/hilbert.pdf
pdfs/deterministic/intro_rl.pdf
pdfs/deterministic/mcts.pdf
pdfs/deterministic/mcts_hilbert.pdf
pdfs/deterministic/mdp.pdf
pdfs/deterministic/off_policy_ddpg.pdf
pdfs/deterministic/ofp.pdf
pdfs/deterministic/ofp_correction.pdf
pdfs/deterministic/rb_mc_mbrl.pdf
pdfs/deterministic/rl.pdf
pdfs/ps/10_trpo_acktr.pdf
pdfs/ps/11_ppo.pdf
pdfs/ps/12_sac.pdf
pdfs/ps/13_rwr.pdf
pdfs/ps/14_wrap_up.pdf
pdfs/ps/1_ps_intro.pdf
pdfs/ps/2_ps_pb.pdf
pdfs/ps/3_pg_derivation1.pdf
pdfs/ps/4_pg_derivation2.pdf
pdfs/ps/5_pg_derivation3.pdf
pdfs/ps/6_baseline_AC.pdf
pdfs/ps/7_bias_variance.pdf
pdfs/ps/8_ofp.pdf
pdfs/ps/9_a2c.pdf
pdfs/ps/CS2621_TRPO_PPO.pdf
pdfs/ps/tqc.pdf
pdfs/regression/batch_lwr.pdf
pdfs/regression/batch_projec.pdf
pdfs/regression/gd_V2.pdf
pdfs/regression/grad_descent.pdf
pdfs/regression/intro_regression.pdf
pdfs/regression/iter_incr.pdf
pdfs/regression/lls.pdf
pdfs/regression/nn_reg.pdf
pdfs/regression/rbfn.pdf
pdfs/regression/robot_model_learning.pdf
tests/eval_agent.py
tests/test_gymagent_continuous_cartpole.py
tests/test_gymagent_continuous_pendulum.py
tests/test_gymagent_continuous_pendulum_a.py
tests/test_gymagent_discrete_cartpole.py
tests/test_rb.py