configs/__init__.py,sha256=JPftAl0UOmUEW7_01z1Ldy367-6HDQymLUtb4cB-Os0,41
configs/deepspeed/zero3_config_gpu1.json,sha256=QS2PioI9GW0oAQ0U0-6hkJCig0CGL0Gon-XqvY5t5qI,887
configs/deepspeed/zero3_config_gpu2.json,sha256=QS2PioI9GW0oAQ0U0-6hkJCig0CGL0Gon-XqvY5t5qI,887
configs/deepspeed/zero3_config_gpu4.json,sha256=QS2PioI9GW0oAQ0U0-6hkJCig0CGL0Gon-XqvY5t5qI,887
configs/deepspeed/zero3_config_gpu8.json,sha256=QS2PioI9GW0oAQ0U0-6hkJCig0CGL0Gon-XqvY5t5qI,887
core/__init__.py,sha256=ZLoFWQbRZmA7N3sNO4jhtFWK4XK39WsL9E7SGGXTbPQ,503
core/config.py,sha256=Uxh6ZwmntzcJoIzixoZP1crC6ar94w-OK8oUr8ifqes,11861
core/model_utils.py,sha256=_AF1XPNZy-EJEfVHhJm8VYzI3AOrL4AVsEfNpNJibh4,6916
core/trainer_base.py,sha256=52r5rzK7b8IgOi5rRs6htMjRuLw37kgGSzYN_M4pH5w,12888
evaluations/README.md,sha256=fvhu5T3t0cEdvyxxsWl-0XEfUtsKtIl3Fk1HOTNs3sY,3346
evaluations/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
evaluations/eval.py,sha256=0tTQSKVgCJERBXjYCq0-9_4idAKrk-r3PL5CMGSeKek,24643
evaluations/eval_datasets/__init__.py,sha256=gG93AxYyIvhKzf51Med9CZbTYkWFpBD9SUTIbBlvkh0,320
evaluations/eval_datasets/gsm8k.py,sha256=5NnIp6SXaualIevnGpv0EjjDyU2e4SC4uSZMQyUJB9I,4529
evaluations/eval_datasets/mmlu.py,sha256=DQRZPNNWUxKNwRgBf5atdnKMU5AtxDusuU6amhMI97Q,4419
fai_rl-0.1.15.dist-info/licenses/LICENSE,sha256=NbkVt7vxbqv1qoOi4kNRYn3VzYu1mJ-SLyoByujD9H4,11310
inference/README.md,sha256=GLB-8x2mtQw5dpoZibxFIAybwXtzU7EUueJ4asv7DDA,3892
inference/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
inference/inference.py,sha256=Wtf7_7NUlas1PNMMqyMjkE5543YNTTHw2T3ybyzp9uU,25545
outputs/llama3-8B-inst-robloxguard-1.0-vanilla-v1-infer_summary.json,sha256=a3IOOCnfKLFDc-Tkpxp6uCN8s7f1ybyhGum0KLu_G2w,5065
outputs/robloxguard-1.0-v1-infer_summary.json,sha256=hqDkVoXCe-oQkwZFAXsxGS--KASZ9i3Z8F__r4Qhw0o,6724
recipes/__init__.py,sha256=JPftAl0UOmUEW7_01z1Ldy367-6HDQymLUtb4cB-Os0,41
recipes/evaluation/gsm8k/llama3_3B_vanilla.yaml,sha256=rQlgO5B64UfqlsRtiDwGl-Qtzd2G0qzl6wCwO8SpTiw,2257
recipes/evaluation/gsm8k/llama3_8B_vanilla.yaml,sha256=gTClptVRlsIcT6rWmC3Sc-Iw2_3n6kBhBwFWt320CQc,2257
recipes/evaluation/gsm8k/qwen3_4B.yaml,sha256=6xYlb3HX9eltGxWUmUdeMps3P-7f2JTP7RZqptTz0k8,2309
recipes/evaluation/gsm8k/qwen3_4B_multi_ckpt.yaml,sha256=0einjqTI2bf-Bq3yY6xd_T4NLrV6h-fIUlzhagok8aA,2459
recipes/evaluation/gsm8k/qwen3_4B_vanilla.yaml,sha256=GNe_zTIK7DjqmgaTmsZ1kY8M7Go1qWn31ROuXAlJ-so,2251
recipes/evaluation/gsm8k/qwen3_8B_vanilla.yaml,sha256=zATcSGQTnImGLDwqhpsRwtOdxar041G1SzurZJ-9qMQ,2232
recipes/evaluation/mmlu/llama3_3B.yaml,sha256=GSKqyzBspZZ9DDTLpzEAB9j2m8W2Vf3YTdNrDiFzOdg,2469
recipes/evaluation/mmlu/llama3_3B_api.yaml,sha256=kuDlu_wcstN8m9Nn0Q0bFOrlpGfhDGurdkt3rtGMe3U,2614
recipes/evaluation/mmlu/llama3_3B_multi_ckpt.yaml,sha256=-KAYT0oxSg06pisv_UiDSSYeb2dTgB9R2ox5dGHE_rU,2739
recipes/evaluation/mmlu/llama3_vanilla_3B.yaml,sha256=Lu2o_lZXWrAuV61A54a_OnhhRP3VvL0qGr7dz8rnSEI,2562
recipes/inference/llama3_3B.yaml,sha256=VTUSmP-ctidPTJvuniedsqGX0m-XXbTKf3vKhLeX918,1974
recipes/inference/llama3_3B_api.yaml,sha256=8KcTDTpSToDxjFaBftr8Kv7DTc0ZofPb2Ru1DjoiyPA,2395
recipes/inference/llama3_3B_local_csv.yaml,sha256=9uQRHyVwAgqgoPHUK818URWeswQBfg9jZR7RLBrPVqU,2091
recipes/inference/llama3_3B_multi_ckpt.yaml,sha256=GeMyfod0i-0TB-xgVJgUNvOASa0m3o5qdMJ4ZclKb2Q,2379
recipes/inference/llama3_vanilla_3B.yaml,sha256=o_-EIzf-H4kl8QiVC3vpXW8wK9OhNjt3F4G6vbbcZAg,2149
recipes/training/cpt/qwen3_30B_A3B_lora.yaml,sha256=wPUiSmm427lNaxZR1DDpIEzLfenCTXzmgqw9SFNud6M,5349
recipes/training/cpt/qwen3_30B_A3B_qlora.yaml,sha256=btTzolhdYZae4IE64vaKCrY7h3zR6XmaPQ-8-2AsmrU,5760
recipes/training/cpt/qwen3_4B_full.yaml,sha256=VL32jZH4fqDYj3aifZIm3XAKghZaOykeE2-FIQqfMa0,3763
recipes/training/cpt/qwen3_4B_lora.yaml,sha256=lPs7qheNmMy5r7cVwqgh253jzVFBVzdv5fg1qEC2k70,4432
recipes/training/cpt/qwen3_4B_qlora.yaml,sha256=bFwHY2KGwcXILfFeqqriIvNByJdTDDxX1zxz7MiHaMo,5766
recipes/training/dpo/llama3_3B_full.yaml,sha256=0dAXgvF4n6Hcj9-PeJ7JvFVUox2_y5VJyw3hvvWFCmI,5044
recipes/training/dpo/llama3_3B_lora.yaml,sha256=X26f15ShL-3Ad09EA18fzhzCXcc-z9valRwjLC_heTs,5761
recipes/training/dpo/llama3_3B_qlora.yaml,sha256=ZasGsvCIfhzHJCw6dGvHPE6qTHjqg32YP3PQ4uUCr7Y,7060
recipes/training/grpo/llama3_3B_full.yaml,sha256=XPqy1fowhZ6Be4kcjfZde-HRncypX5f1LM88ETftCUQ,5018
recipes/training/grpo/llama3_3B_lora.yaml,sha256=6i_7A8jQrQgccg3LpJLuleWq0Osyr1HyzwbBp8gMC-Q,5737
recipes/training/gspo/llama3_3B_full.yaml,sha256=sUdhTcM1X0XG9JTSIyiuUlKoHHBRk1w0Rgl-yhtMGCw,5632
recipes/training/gspo/llama3_3B_lora.yaml,sha256=u3W3acrCx92Fwn9QuYNz7_6HVYPdOwKNkTVxfYy1sz4,6419
recipes/training/ppo/llama3_3B_full.yaml,sha256=efkQ953tjOmh_4wD8Ey3VZ8kWkfXSv-bGuz-PmYfvro,4559
recipes/training/ppo/llama3_3B_lora.yaml,sha256=50C-lgfJ61MGbjpXLViiY1Y3tKVtzZ1V82idGWVnfVE,5234
recipes/training/ppo/llama3_3B_qlora.yaml,sha256=P-TLyxa2AuFG4o5fjT1dCNPBKBaADdaEh2xgGGhmGMs,5600
recipes/training/sft/llama3_3B_full.yaml,sha256=ND-GqR-8vLEU3wXYKjiPKv2CNdkVqjhUwRWqR9-rQd8,4955
recipes/training/sft/llama3_3B_lora.yaml,sha256=sv_fySJqkxWtvf_RVNwOIORwmiRJa0ZlfEpXGwwCHKc,5665
recipes/training/sft/llama3_3B_qlora.yaml,sha256=sYPLhHDMjB0jfseo9Ee1dkPvHx0yQy8WPY_PJpePNvo,6030
trainers/README.md,sha256=exFjJWsziSQGOXRhzgOpc_5uOrkuR7xLJG8FxF325_I,6714
trainers/__init__.py,sha256=4zwmjoSRgoJwm5gnNa44Vw4xyY_3I3UXgX9c0aedi10,378
trainers/cpt_trainer.py,sha256=FCq1izexhsPmPIcH7lUdEkQGv77sIMp89-RoIrDTrVg,6847
trainers/dpo_trainer.py,sha256=BGMQs1d3GGcG4MM_DkmSZVUmjNsJ3OuX13B9msaj-V8,9946
trainers/grpo_trainer.py,sha256=EEx7NqnXY92DrDQ5oJd6BVA7oj1-FL8JeLSF4eg6ZJU,10836
trainers/gspo_trainer.py,sha256=wkJmi04o-5ndtRHg7jGnjHpPLIs5ZWjJaoDCgkS9c3Y,11242
trainers/ppo_trainer.py,sha256=jrfMlSfnOx0kv7pA16j1FxljR3bBU984qvpoqaRzpmI,16909
trainers/sft_trainer.py,sha256=heDeQVO0TLQGNRHHddljF0uvMCRyljo2DZC1YHUfaA8,8282
trainers/train.py,sha256=KVqSBjaseZvi4pzbgnyxHrZ2gF3aGYEkS5XXMyzfuXk,14049
trainers/rewards/__init__.py,sha256=1n7-T_HVBsCUh6g3VSA9kbkYZtKOxP4xcZtZN7lKS_k,138
trainers/rewards/accuracy_rewards.py,sha256=_UaSi9AO3YU7F7ElQDHjwGRPtSyzWgkV1Jy2wpObvAg,2012
trainers/rewards/custom_rewards.py,sha256=wU5kdglfVwSLh-yQYZMaOqjzzRuZ2oToAuz4n-U2l6w,1815
trainers/rewards/format_rewards.py,sha256=9yyMqLll0-1Koh1hCdsu33RtQ3jO3QaQeTQrRJHuSMk,684
trainers/templates/__init__.py,sha256=LjHvIpd2MlC5KXj-ytZeGlB6RKBdxse-SmNs5KX9Kto,210
trainers/templates/gsm8k_template.py,sha256=QE4ztuGHCkcxfFpRtF0laEfkqVeexT3R9594TIWmhRM,1568
trainers/templates/openmathinstruct_template.py,sha256=A09p8_pqJ1ncdFoj377bF37v9IsN-wUj31gorP8Mda0,1410
utils/__init__.py,sha256=Lfu5757fBA3Pqy2G8QGbSG090Lp_E09vb26iha4049s,1515
utils/api_utils.py,sha256=f1p9ucSc-r70Cs3g8KULL7cBXIRKcnEHHi5wDeGKK_s,12581
utils/config_validation.py,sha256=Lxy_8jZY0OyMI1rv8Xk3Kka6TCr16gSzW318dh3WTqg,1751
utils/dataset_utils.py,sha256=NIIvvcU75PGOWid8Vu7CY60gCG2KV5PHXvfSBn9NlQU,1520
utils/device_utils.py,sha256=MHKrITUY2Z-ZpCIyvPoIMCYGFrtBE4MfiqRHAJES62A,14985
utils/hosted_llm_config.py,sha256=vBbPrFyWTy8VKKmb67DU3xZ0pTrqF6O5fcPCMnfjFQ8,8598
utils/logging_utils.py,sha256=f8-UbVwxuG7JfK8JHgvAD6qnAOaj5D2STjmZmsl_fs4,9360
utils/recipe_overrides.py,sha256=hx25PGBPJjBBTxNNxoTGXUwm87n9ffAfNeQBSvbXxpY,2220
utils/s3_utils.py,sha256=1Tm6ngGYr9CPY_Fj14jnybM1ztlAeFRojq4VYK3uwp0,5813
venv_deploy/share/jupyter/kernels/python3/kernel.json,sha256=69y5qspxusKKSbKfpYw86C4_UFV01AU6NtRuUi9t-kI,193
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/install.json,sha256=e65KcDNtdaA4aZgF1mLHIhwaoIzpH9LmUueG4iJYmI0,197
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/package.json,sha256=vmebfycAy9ffbvozQULkX7ZwWimcOH7gX3pG2PctTHE,3551
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/schemas/@jupyter-widgets/jupyterlab-manager/plugin.json,sha256=IWNBmBm-GTATCrzha5m-Kh0Gt6H4KzGsnzcuSigjx2A,375
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/static/third-party-licenses.json,sha256=rAEtxqfQ91D1yZL60D4LaDq1y5tR-5HE0ih2wdIEZoY,32961
fai_rl-0.1.15.dist-info/METADATA,sha256=ZkpCFpsTqtHQQQdfYQdMB6YOQpSvRPF894Y93a6XZqY,18114
fai_rl-0.1.15.dist-info/WHEEL,sha256=aeYiig01lYGDzBgS8HxWXOg3uV61G9ijOsup-k9o1sk,91
fai_rl-0.1.15.dist-info/entry_points.txt,sha256=R0R4WJEzjAbhyaGoW7rHQg0YuAP918a-lBO9wIvnMPU,133
fai_rl-0.1.15.dist-info/top_level.txt,sha256=cW5KiCFek4yxEM12BmfbhHrZjVwSBD_APYGPaJj1kT4,78
fai_rl-0.1.15.dist-info/RECORD,,
