# Entry-point group "aligntune.backends": maps a short backend name to the
# object that implements it, written as "importable.module:ObjectName".
# NOTE(review): if this file is generated by the build tooling, hand-written
# comments may be lost on regeneration -- confirm where the source of truth is.
[aligntune.backends]
trl = aligntune.backends.trl:TRLBackend
unsloth = aligntune.backends.unsloth:UnslothBackend

# Entry-point group "aligntune.evaluation": maps a runner name to its class.
# The group is spelled "evaluation" while the target modules live under the
# "aligntune.eval" package; the two names are intentionally not identical here.
[aligntune.evaluation]
custom = aligntune.eval.custom_runner:CustomEvalRunner
lm_eval = aligntune.eval.lm_eval_runner:LMEvalRunner

# Entry-point group "aligntune.rewards": both entries resolve to objects in
# the same module, aligntune.rewards.core.
[aligntune.rewards]
factory = aligntune.rewards.core:RewardFunctionFactory
registry = aligntune.rewards.core:RewardRegistry

# Entry-point group "aligntune.trainers": keys follow the pattern
# "<backend>_<method>" and point at the trainer class for that combination.
# The trl backend registers dpo, ppo and sft; the unsloth backend registers
# dpo, grpo, gspo, ppo and sft.
# NOTE(review): the unsloth grpo/gspo targets are named "Enhanced*Trainer"
# rather than "Unsloth*Trainer" like their siblings -- confirm these are the
# intended class names in the referenced modules.
[aligntune.trainers]
trl_dpo = aligntune.backends.trl.rl.dpo.dpo:TRLDPOTrainer
trl_ppo = aligntune.backends.trl.rl.ppo.ppo:TRLPPOTrainer
trl_sft = aligntune.backends.trl.sft.sft:TRLSFTTrainer
unsloth_dpo = aligntune.backends.unsloth.rl.dpo.dpo:UnslothDPOTrainer
unsloth_grpo = aligntune.backends.unsloth.rl.grpo.grpo:EnhancedGRPOTrainer
unsloth_gspo = aligntune.backends.unsloth.rl.gspo.gspo:EnhancedGSPOTrainer
unsloth_ppo = aligntune.backends.unsloth.rl.ppo.ppo:UnslothPPOTrainer
unsloth_sft = aligntune.backends.unsloth.sft.sft:UnslothSFTTrainer

# Command-line launchers: each key is the name of an executable created at
# install time, and the value is the callable it runs. Both names below
# invoke the same function, aligntune.cli:main ("at" is a short alias).
# NOTE(review): "at" is also the name of the standard POSIX job-scheduling
# utility; depending on PATH order this alias may shadow it (or be shadowed
# by it) -- confirm the short name is intended.
[console_scripts]
aligntune = aligntune.cli:main
at = aligntune.cli:main
