configs/__init__.py,sha256=JPftAl0UOmUEW7_01z1Ldy367-6HDQymLUtb4cB-Os0,41
configs/deepspeed/zero1_config.json,sha256=KP8C66RmQVa_V-jH4j6cAJxH4oOsEVcY8DxMjty9x3M,574
configs/deepspeed/zero3_config.json,sha256=QS2PioI9GW0oAQ0U0-6hkJCig0CGL0Gon-XqvY5t5qI,887
core/__init__.py,sha256=ZLoFWQbRZmA7N3sNO4jhtFWK4XK39WsL9E7SGGXTbPQ,503
core/config.py,sha256=9wnsyb1MewEqPm6s_W-CFYtHe6djRetc4gpak8Z1VS8,13706
core/model_utils.py,sha256=qS9VI0yTambhFd6cvxjCkTHVVFtwF52WRs9hhSjmbQ8,7032
core/trainer_base.py,sha256=dNPYoe7dVLv3r5ICpgEAznWB2WaL7QU9i5FNONrLbDw,14406
evaluations/README.md,sha256=fvhu5T3t0cEdvyxxsWl-0XEfUtsKtIl3Fk1HOTNs3sY,3346
evaluations/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
evaluations/eval.py,sha256=0tTQSKVgCJERBXjYCq0-9_4idAKrk-r3PL5CMGSeKek,24643
evaluations/eval_datasets/__init__.py,sha256=gG93AxYyIvhKzf51Med9CZbTYkWFpBD9SUTIbBlvkh0,320
evaluations/eval_datasets/gsm8k.py,sha256=5NnIp6SXaualIevnGpv0EjjDyU2e4SC4uSZMQyUJB9I,4529
evaluations/eval_datasets/mmlu.py,sha256=DQRZPNNWUxKNwRgBf5atdnKMU5AtxDusuU6amhMI97Q,4419
fai_rl-0.1.18.dist-info/licenses/LICENSE,sha256=NbkVt7vxbqv1qoOi4kNRYn3VzYu1mJ-SLyoByujD9H4,11310
inference/README.md,sha256=GLB-8x2mtQw5dpoZibxFIAybwXtzU7EUueJ4asv7DDA,3892
inference/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
inference/inference.py,sha256=-hMPhLE5HDYZzy8-qf2SeNNdrkaz7neD_oZ-KWnlS-Y,25800
recipes/__init__.py,sha256=JPftAl0UOmUEW7_01z1Ldy367-6HDQymLUtb4cB-Os0,41
recipes/evaluation/gsm8k/llama3_3B_vanilla.yaml,sha256=rQlgO5B64UfqlsRtiDwGl-Qtzd2G0qzl6wCwO8SpTiw,2257
recipes/evaluation/gsm8k/llama3_8B_vanilla.yaml,sha256=gTClptVRlsIcT6rWmC3Sc-Iw2_3n6kBhBwFWt320CQc,2257
recipes/evaluation/gsm8k/qwen3_4B.yaml,sha256=6xYlb3HX9eltGxWUmUdeMps3P-7f2JTP7RZqptTz0k8,2309
recipes/evaluation/gsm8k/qwen3_4B_multi_ckpt.yaml,sha256=0einjqTI2bf-Bq3yY6xd_T4NLrV6h-fIUlzhagok8aA,2459
recipes/evaluation/gsm8k/qwen3_4B_vanilla.yaml,sha256=GNe_zTIK7DjqmgaTmsZ1kY8M7Go1qWn31ROuXAlJ-so,2251
recipes/evaluation/gsm8k/qwen3_8B_vanilla.yaml,sha256=zATcSGQTnImGLDwqhpsRwtOdxar041G1SzurZJ-9qMQ,2232
recipes/evaluation/mmlu/llama3_3B.yaml,sha256=GSKqyzBspZZ9DDTLpzEAB9j2m8W2Vf3YTdNrDiFzOdg,2469
recipes/evaluation/mmlu/llama3_3B_api.yaml,sha256=kuDlu_wcstN8m9Nn0Q0bFOrlpGfhDGurdkt3rtGMe3U,2614
recipes/evaluation/mmlu/llama3_3B_multi_ckpt.yaml,sha256=-KAYT0oxSg06pisv_UiDSSYeb2dTgB9R2ox5dGHE_rU,2739
recipes/evaluation/mmlu/llama3_vanilla_3B.yaml,sha256=Lu2o_lZXWrAuV61A54a_OnhhRP3VvL0qGr7dz8rnSEI,2562
recipes/inference/llama3_3B.yaml,sha256=VTUSmP-ctidPTJvuniedsqGX0m-XXbTKf3vKhLeX918,1974
recipes/inference/llama3_3B_api.yaml,sha256=8KcTDTpSToDxjFaBftr8Kv7DTc0ZofPb2Ru1DjoiyPA,2395
recipes/inference/llama3_3B_local_csv.yaml,sha256=9uQRHyVwAgqgoPHUK818URWeswQBfg9jZR7RLBrPVqU,2091
recipes/inference/llama3_3B_multi_ckpt.yaml,sha256=GeMyfod0i-0TB-xgVJgUNvOASa0m3o5qdMJ4ZclKb2Q,2379
recipes/inference/llama3_vanilla_3B.yaml,sha256=o_-EIzf-H4kl8QiVC3vpXW8wK9OhNjt3F4G6vbbcZAg,2149
recipes/training/cpt/qwen3_30B_A3B_lora.yaml,sha256=X9V015dyzPcPqfKJZ3aV_IoOc9kploDaZaqhhz8OMNA,6133
recipes/training/cpt/qwen3_30B_A3B_qlora.yaml,sha256=oe29zhKerW2BA95cZRhrB0GWYn6TnpKd-Y4X1RmLGVo,6237
recipes/training/cpt/qwen3_4B_lora.yaml,sha256=TtjnTkfnMcqSidpz0qATvNlBe-HxD97Z80FhTl8EHmg,5596
recipes/training/cpt/qwen3_4B_qlora.yaml,sha256=--mUIXPjHP9dMewtaFFt0bmrQR6Scgfq5RS2PLiEwHk,6007
recipes/training/dpo/llama3_3B_full.yaml,sha256=SIFb4KQ4V2stIqLRGVoUS_0wJllJIKV0cNaUYDbl_VQ,6320
recipes/training/dpo/llama3_3B_lora.yaml,sha256=A8YUMsCqM84xLb8i-Zni56piZpAh_GLHr9kCNGgCd90,6921
recipes/training/dpo/llama3_3B_qlora.yaml,sha256=_zpbLWk5Dzc1rt1hKwiFgxPi_34rstQjqnefZzJKJdw,7297
recipes/training/grpo/llama3_3B_full.yaml,sha256=nyyfon5LkugN_OuXFVTmCNT_9yfim4eEmu01SK6DDlY,6294
recipes/training/grpo/llama3_3B_lora.yaml,sha256=oRXAqlc_iV0rdPsp5P9rC3D8F9C9dSfCxd3NZ-EA2q4,6897
recipes/training/gspo/llama3_3B_full.yaml,sha256=72Jhs89QnAds9SWFNu1q0wrfefrn1fOhe_3D68tgVt0,6908
recipes/training/gspo/llama3_3B_lora.yaml,sha256=ffTZNo_cyiNFDq7FXQK6F5lvlun5Ri96EXXCTbh489E,7579
recipes/training/ppo/llama3_3B_full.yaml,sha256=gwPnmcFhOZcHa5EIvJ2pu17dZz2__g0ft_T1V7Lb60c,5719
recipes/training/ppo/llama3_3B_lora.yaml,sha256=R84-ylI4PAm89pN0KcrTNnqeEFeDvfGCNQpHEoKPpeU,6394
recipes/training/ppo/llama3_3B_qlora.yaml,sha256=iLKWN4J_351wNhAAx1UZs2XAhdPW4WTEMTdnlbx7-6M,6760
recipes/training/sft/llama3_3B_full.yaml,sha256=PBzqvPkFrZbP8joNXWofENtzC5cEYWyGXRyciN-ga8g,6232
recipes/training/sft/llama3_3B_lora.yaml,sha256=8uc1tIQXe4NzuNc3ipi20xKrCgSCzYmzB_DQo_T3dkA,6827
recipes/training/sft/llama3_3B_qlora.yaml,sha256=N3yj9C81vzZ77oxwGFO5t1-gGyGvMJKTsviCyvJ5vUo,7192
trainers/README.md,sha256=exFjJWsziSQGOXRhzgOpc_5uOrkuR7xLJG8FxF325_I,6714
trainers/__init__.py,sha256=4-J2h1APE3LHEJNDAg-ikNgN64LC7MHcHIauw7L7w4M,323
trainers/cpt_trainer.py,sha256=epIU4yOvyGMLP0D4bR7TQYqMvASKQCTTG2MIpaS6paw,7005
trainers/dpo_trainer.py,sha256=tS65VvZP1gDtXZKJErs9e1ETvMgCq4EtbA9FQ9D1Wko,9885
trainers/grpo_trainer.py,sha256=Kuaolax1l4mINais7qL_pg1Sze2N9SJImddGPYbqr8s,10775
trainers/gspo_trainer.py,sha256=XT7CgCnn_ll7Ep3BVk_2FNMlPLCx9o0F3AUoyy3RQ3Q,11181
trainers/sft_trainer.py,sha256=RjAZ8LnZSxGv0pVxDBT9GS8vaEMRVw9CRGa8ncB2RG4,8403
trainers/train.py,sha256=D24Br42r5xxAqPUAYZ5DD2Gy9mJFB7JmR8-O8GjKuhY,17248
trainers/rewards/__init__.py,sha256=1n7-T_HVBsCUh6g3VSA9kbkYZtKOxP4xcZtZN7lKS_k,138
trainers/rewards/accuracy_rewards.py,sha256=_UaSi9AO3YU7F7ElQDHjwGRPtSyzWgkV1Jy2wpObvAg,2012
trainers/rewards/custom_rewards.py,sha256=wU5kdglfVwSLh-yQYZMaOqjzzRuZ2oToAuz4n-U2l6w,1815
trainers/rewards/format_rewards.py,sha256=9yyMqLll0-1Koh1hCdsu33RtQ3jO3QaQeTQrRJHuSMk,684
trainers/templates/__init__.py,sha256=LjHvIpd2MlC5KXj-ytZeGlB6RKBdxse-SmNs5KX9Kto,210
trainers/templates/gsm8k_template.py,sha256=QE4ztuGHCkcxfFpRtF0laEfkqVeexT3R9594TIWmhRM,1568
trainers/templates/openmathinstruct_template.py,sha256=A09p8_pqJ1ncdFoj377bF37v9IsN-wUj31gorP8Mda0,1410
utils/__init__.py,sha256=Lfu5757fBA3Pqy2G8QGbSG090Lp_E09vb26iha4049s,1515
utils/api_utils.py,sha256=f1p9ucSc-r70Cs3g8KULL7cBXIRKcnEHHi5wDeGKK_s,12581
utils/config_validation.py,sha256=Lxy_8jZY0OyMI1rv8Xk3Kka6TCr16gSzW318dh3WTqg,1751
utils/dataset_utils.py,sha256=NIIvvcU75PGOWid8Vu7CY60gCG2KV5PHXvfSBn9NlQU,1520
utils/device_utils.py,sha256=dmgSHXgvasnFMQUN8y1MAvVI24eyJDUnNMCmAWFtpkE,16355
utils/hosted_llm_config.py,sha256=vBbPrFyWTy8VKKmb67DU3xZ0pTrqF6O5fcPCMnfjFQ8,8598
utils/logging_utils.py,sha256=77OILPp7ZY7dQZGc-O8Yt0yMgNm1cCQMf5Rjy9hA1Tg,10783
utils/recipe_overrides.py,sha256=iJfaWxv4f95EVacXTRmSk4jFCjxrzd-A7dCmZRAaWME,2642
utils/s3_utils.py,sha256=x_VM9BxZnbZFpLhvSXqmdmBL2T9NiYzAJ22xs93EUTE,8502
venv_deploy/share/jupyter/kernels/python3/kernel.json,sha256=69y5qspxusKKSbKfpYw86C4_UFV01AU6NtRuUi9t-kI,193
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/install.json,sha256=e65KcDNtdaA4aZgF1mLHIhwaoIzpH9LmUueG4iJYmI0,197
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/package.json,sha256=vmebfycAy9ffbvozQULkX7ZwWimcOH7gX3pG2PctTHE,3551
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/schemas/@jupyter-widgets/jupyterlab-manager/plugin.json,sha256=IWNBmBm-GTATCrzha5m-Kh0Gt6H4KzGsnzcuSigjx2A,375
venv_deploy/share/jupyter/labextensions/@jupyter-widgets/jupyterlab-manager/static/third-party-licenses.json,sha256=rAEtxqfQ91D1yZL60D4LaDq1y5tR-5HE0ih2wdIEZoY,32961
fai_rl-0.1.18.dist-info/METADATA,sha256=8phHFsmUplztWFWYen68pEUYhlzX_5cKCE_3Ipr1BZA,18317
fai_rl-0.1.18.dist-info/WHEEL,sha256=aeYiig01lYGDzBgS8HxWXOg3uV61G9ijOsup-k9o1sk,91
fai_rl-0.1.18.dist-info/entry_points.txt,sha256=R0R4WJEzjAbhyaGoW7rHQg0YuAP918a-lBO9wIvnMPU,133
fai_rl-0.1.18.dist-info/top_level.txt,sha256=71UuZ28xRoqhQLaGSSNEf1JPzXbT2OP8SEV6g4ig07A,70
fai_rl-0.1.18.dist-info/RECORD,,
