README.md
pyproject.toml
setup.py
FAI_RL.egg-info/PKG-INFO
FAI_RL.egg-info/SOURCES.txt
FAI_RL.egg-info/dependency_links.txt
FAI_RL.egg-info/entry_points.txt
FAI_RL.egg-info/requires.txt
FAI_RL.egg-info/top_level.txt
configs/__init__.py
configs/deepspeed/zero3_config_gpu1.json
configs/deepspeed/zero3_config_gpu2.json
configs/deepspeed/zero3_config_gpu4.json
configs/deepspeed/zero3_config_gpu8.json
configs/evaluation/mmlu/llama3_3B_recipe.yaml
configs/inference/llama3_3B_recipe.yaml
configs/training/dpo/llama3_3B_full_recipe.yaml
configs/training/dpo/llama3_3B_lora_recipe.yaml
configs/training/dpo/llama3_3B_qlora_recipe.yaml
configs/training/grpo/llama3_3B_full_recipe.yaml
configs/training/grpo/llama3_3B_lora_recipe.yaml
configs/training/gspo/llama3_3B_full_recipe.yaml
configs/training/gspo/llama3_3B_lora_recipe.yaml
configs/training/ppo/llama3_3B_full_recipe.yaml
configs/training/ppo/llama3_3B_lora_recipe.yaml
configs/training/ppo/llama3_3B_qlora_recipe.yaml
configs/training/sft/llama3_3B_full_recipe.yaml
configs/training/sft/llama3_3B_lora_recipe.yaml
configs/training/sft/llama3_3B_qlora_recipe.yaml
core/__init__.py
core/config.py
core/model_utils.py
core/trainer_base.py
evaluations/README.md
evaluations/__init__.py
evaluations/eval.py
inference/README.md
inference/__init__.py
inference/inference.py
trainers/README.md
trainers/__init__.py
trainers/dpo_trainer.py
trainers/grpo_trainer.py
trainers/gspo_trainer.py
trainers/ppo_trainer.py
trainers/sft_trainer.py
trainers/train.py
trainers/rewards/__init__.py
trainers/rewards/accuracy_rewards.py
trainers/rewards/format_rewards.py
trainers/templates/__init__.py
trainers/templates/gsm8k_template.py
trainers/templates/openmathinstruct_template.py
utils/__init__.py
utils/logging_utils.py
venv_deploy/share/jupyter/kernels/python3/kernel.json
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/install.json
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/package.json
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/schemas/@jupyter-widgets/jupyterlab-manager/plugin.json
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/static/third-party-licenses.json