LICENSE
MANIFEST.in
README.md
pyproject.toml
setup.py
docs/concepts.md
docs/cookbook.md
docs/optimization_guide.md
docs/reward_cookbook.md
docs/usage.md
docs/images/llamagym.jpg
docs/images/llm_normalization_comparison.png
docs/images/llm_rewards_no_norm.png
docs/images/llm_rewards_std_norm.png
examples/advanced/advanced_components.py
examples/advanced/deep_reward_model.py
examples/advanced/gym_integration.py
examples/advanced/memory_example.py
examples/advanced/reward_optimization.py
examples/advanced/rlhf_example.py
examples/advanced/visualization.py
examples/basic/basic_example.py
rllama/__init__.py
rllama/engine.py
rllama/logger.py
rllama/memory.py
rllama/registry.py
rllama.egg-info/PKG-INFO
rllama.egg-info/SOURCES.txt
rllama.egg-info/dependency_links.txt
rllama.egg-info/requires.txt
rllama.egg-info/top_level.txt
rllama/dashboard/__init__.py
rllama/dashboard/visualizer.py
rllama/integration/__init__.py
rllama/integration/gym_wrapper.py
rllama/integration/stable_baselines.py
rllama/models/__init__.py
rllama/models/base.py
rllama/models/reward_models.py
rllama/models/trainer.py
rllama/rewards/__init__.py
rllama/rewards/base.py
rllama/rewards/composer.py
rllama/rewards/optimizer.py
rllama/rewards/registry.py
rllama/rewards/shaper.py
rllama/rewards/components/__init__.py
rllama/rewards/components/advanced.py
rllama/rewards/components/advanced_components.py
rllama/rewards/components/common.py
rllama/rewards/components/length_rewards.py
rllama/rewards/components/llm_components.py
rllama/rewards/components/llm_rewards.py
rllama/rewards/components/robotics_components.py
rllama/rewards/components/specific_rewards.py
rllama/rewards/components/learning/__init__.py
rllama/rewards/components/learning/adaptive.py
rllama/rewards/components/learning/adversarial.py
rllama/rewards/components/learning/meta.py
rllama/rlhf/__init__.py
rllama/rlhf/collector.py
rllama/rlhf/preference.py