.gitignore
.pre-commit-config.yaml
CITATION.cff
CONTRIBUTING.md
LICENSE
README.md
pyproject.toml
requirements.txt
setup.py
.github/workflows/ci.yml
.github/workflows/conda-publish.yml
.github/workflows/docs-build.yml
.github/workflows/docs.yml
.github/workflows/pre-commit.yml
.github/workflows/pypi-publish.yml
.github/workflows/tests.yml
comlrl/__init__.py
comlrl.egg-info/PKG-INFO
comlrl.egg-info/SOURCES.txt
comlrl.egg-info/dependency_links.txt
comlrl.egg-info/requires.txt
comlrl.egg-info/top_level.txt
comlrl/models/__init__.py
comlrl/models/actor_critic.py
comlrl/trainers/__init__.py
comlrl/trainers/actor_critic/__init__.py
comlrl/trainers/actor_critic/ac_base.py
comlrl/trainers/actor_critic/iac.py
comlrl/trainers/actor_critic/maac.py
comlrl/trainers/reinforce/__init__.py
comlrl/trainers/reinforce/magrpo.py
comlrl/trainers/reinforce/mareinforce.py
comlrl/trainers/reinforce/maremax.py
comlrl/trainers/reinforce/marloo.py
comlrl/utils/__init__.py
comlrl/utils/formatters.py
comlrl/utils/model_loading.py
comlrl/utils/reward_processor.py
comlrl/utils/reward_utils.py
comlrl/utils/tokenizer_utils.py
docs/.gitignore
docs/.trigger
docs/README.md
docs/go.mod
docs/go.sum
docs/hugo.toml
docs/assets/_custom.scss
docs/assets/ac.svg
docs/assets/align-tree.svg
docs/assets/comlrl-icon.png
docs/assets/comlrl-icon.svg
docs/assets/comlrl-logo.png
docs/assets/comlrl.png
docs/assets/cross-tree.svg
docs/assets/demo.gif
docs/assets/email.svg
docs/assets/joint-tree.svg
docs/assets/katex.json
docs/assets/sponsors.jpg
docs/content/_index.md
docs/content/docs/dev/_index.md
docs/content/docs/dev/changelog.md
docs/content/docs/dev/contributing.md
docs/content/docs/dev/support.md
docs/content/docs/env/_index.md
docs/content/docs/env/code-completion.md
docs/content/docs/env/coding.md
docs/content/docs/env/minecraft.md
docs/content/docs/env/writing.md
docs/content/docs/examples/_index.md
docs/content/docs/examples/comlrl-quick-start.md
docs/content/docs/user-guide/_index.md
docs/content/docs/user-guide/installation.md
docs/content/docs/user-guide/model-loading.md
docs/content/docs/user-guide/multi-agent-actor-critic.md
docs/content/docs/user-guide/multi-agent-reinforce.md
docs/content/docs/user-guide/multi-turn-training.md
docs/layouts/_partials/docs/inject/head.html
docs/static/css/sidebar.css
docs/static/img/ac.svg
docs/static/img/align-tree.svg
docs/static/img/comlrl-icon.png
docs/static/img/comlrl-icon.svg
docs/static/img/comlrl-logo.png
docs/static/img/cross-tree.svg
docs/static/img/demo.gif
docs/static/img/joint-tree.svg
examples/leetcode-func-print.py
examples/story-len-ratio.py
examples/tldr-len-ratio.py
tests/test_config_constraints.py
tests/test_model_loading.py
tests/test_trainer_constraints.py