configs/__init__.py,sha256=JPftAl0UOmUEW7_01z1Ldy367-6HDQymLUtb4cB-Os0,41
configs/deepspeed/zero1_config.json,sha256=KP8C66RmQVa_V-jH4j6cAJxH4oOsEVcY8DxMjty9x3M,574
configs/deepspeed/zero3_config.json,sha256=QS2PioI9GW0oAQ0U0-6hkJCig0CGL0Gon-XqvY5t5qI,887
core/__init__.py,sha256=ZLoFWQbRZmA7N3sNO4jhtFWK4XK39WsL9E7SGGXTbPQ,503
core/config.py,sha256=ePtCxN1MuVG-v72wi2z-n7hyl3Dyqk_3R0aLc4B7Udw,14482
core/model_utils.py,sha256=qS9VI0yTambhFd6cvxjCkTHVVFtwF52WRs9hhSjmbQ8,7032
core/trainer_base.py,sha256=iU2C91QsDoea9tS9wfHvYHz-RPBj-Lkir7OCnI_4Wks,17319
evaluations/README.md,sha256=fvhu5T3t0cEdvyxxsWl-0XEfUtsKtIl3Fk1HOTNs3sY,3346
evaluations/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
evaluations/eval.py,sha256=0tTQSKVgCJERBXjYCq0-9_4idAKrk-r3PL5CMGSeKek,24643
evaluations/eval_datasets/__init__.py,sha256=gG93AxYyIvhKzf51Med9CZbTYkWFpBD9SUTIbBlvkh0,320
evaluations/eval_datasets/gsm8k.py,sha256=5NnIp6SXaualIevnGpv0EjjDyU2e4SC4uSZMQyUJB9I,4529
evaluations/eval_datasets/mmlu.py,sha256=DQRZPNNWUxKNwRgBf5atdnKMU5AtxDusuU6amhMI97Q,4419
fai_rl-0.1.27.dist-info/licenses/LICENSE,sha256=NbkVt7vxbqv1qoOi4kNRYn3VzYu1mJ-SLyoByujD9H4,11310
inference/README.md,sha256=GLB-8x2mtQw5dpoZibxFIAybwXtzU7EUueJ4asv7DDA,3892
inference/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
inference/inference.py,sha256=-hMPhLE5HDYZzy8-qf2SeNNdrkaz7neD_oZ-KWnlS-Y,25800
recipes/__init__.py,sha256=JPftAl0UOmUEW7_01z1Ldy367-6HDQymLUtb4cB-Os0,41
recipes/evaluation/gsm8k/llama3_3B_vanilla.yaml,sha256=rQlgO5B64UfqlsRtiDwGl-Qtzd2G0qzl6wCwO8SpTiw,2257
recipes/evaluation/gsm8k/llama3_8B_vanilla.yaml,sha256=gTClptVRlsIcT6rWmC3Sc-Iw2_3n6kBhBwFWt320CQc,2257
recipes/evaluation/gsm8k/qwen3_4B.yaml,sha256=6xYlb3HX9eltGxWUmUdeMps3P-7f2JTP7RZqptTz0k8,2309
recipes/evaluation/gsm8k/qwen3_4B_multi_ckpt.yaml,sha256=0einjqTI2bf-Bq3yY6xd_T4NLrV6h-fIUlzhagok8aA,2459
recipes/evaluation/gsm8k/qwen3_4B_vanilla.yaml,sha256=GNe_zTIK7DjqmgaTmsZ1kY8M7Go1qWn31ROuXAlJ-so,2251
recipes/evaluation/gsm8k/qwen3_8B_vanilla.yaml,sha256=zATcSGQTnImGLDwqhpsRwtOdxar041G1SzurZJ-9qMQ,2232
recipes/evaluation/mmlu/llama3_3B.yaml,sha256=GSKqyzBspZZ9DDTLpzEAB9j2m8W2Vf3YTdNrDiFzOdg,2469
recipes/evaluation/mmlu/llama3_3B_api.yaml,sha256=kuDlu_wcstN8m9Nn0Q0bFOrlpGfhDGurdkt3rtGMe3U,2614
recipes/evaluation/mmlu/llama3_3B_multi_ckpt.yaml,sha256=-KAYT0oxSg06pisv_UiDSSYeb2dTgB9R2ox5dGHE_rU,2739
recipes/evaluation/mmlu/llama3_vanilla_3B.yaml,sha256=Lu2o_lZXWrAuV61A54a_OnhhRP3VvL0qGr7dz8rnSEI,2562
recipes/inference/llama3_3B.yaml,sha256=VTUSmP-ctidPTJvuniedsqGX0m-XXbTKf3vKhLeX918,1974
recipes/inference/llama3_3B_api.yaml,sha256=8KcTDTpSToDxjFaBftr8Kv7DTc0ZofPb2Ru1DjoiyPA,2395
recipes/inference/llama3_3B_local_csv.yaml,sha256=9uQRHyVwAgqgoPHUK818URWeswQBfg9jZR7RLBrPVqU,2091
recipes/inference/llama3_3B_multi_ckpt.yaml,sha256=GeMyfod0i-0TB-xgVJgUNvOASa0m3o5qdMJ4ZclKb2Q,2379
recipes/inference/llama3_vanilla_3B.yaml,sha256=o_-EIzf-H4kl8QiVC3vpXW8wK9OhNjt3F4G6vbbcZAg,2149
recipes/training/README.md,sha256=Bdhrdgxf2kRUZifKhD2dWGZVs7UFVLXJk8PWzBVg47g,8302
recipes/training/cpt/qwen3_30B_A3B_lora.yaml,sha256=X9V015dyzPcPqfKJZ3aV_IoOc9kploDaZaqhhz8OMNA,6133
recipes/training/cpt/qwen3_30B_A3B_qlora.yaml,sha256=oe29zhKerW2BA95cZRhrB0GWYn6TnpKd-Y4X1RmLGVo,6237
recipes/training/cpt/qwen3_4B_local_file.yaml,sha256=kcPE2SHEQFYSe1kW5o2VNfnf_cmkYgrw3DSAwrKdPtc,5577
recipes/training/cpt/qwen3_4B_lora.yaml,sha256=TtjnTkfnMcqSidpz0qATvNlBe-HxD97Z80FhTl8EHmg,5596
recipes/training/cpt/qwen3_4B_qlora.yaml,sha256=--mUIXPjHP9dMewtaFFt0bmrQR6Scgfq5RS2PLiEwHk,6007
recipes/training/cpt/qwen3_4B_s3_file.yaml,sha256=WvJ_Guyvr7252zjK16C1WHk-Y9X26sLPKmYhoyldbM0,5808
recipes/training/dpo/llama3_3B_full.yaml,sha256=SIFb4KQ4V2stIqLRGVoUS_0wJllJIKV0cNaUYDbl_VQ,6320
recipes/training/dpo/llama3_3B_local_file.yaml,sha256=kv-EwZHrN6knysf7-l_TJ1m7RDFqLJLVfW1dZq4upl0,6543
recipes/training/dpo/llama3_3B_lora.yaml,sha256=A8YUMsCqM84xLb8i-Zni56piZpAh_GLHr9kCNGgCd90,6921
recipes/training/dpo/llama3_3B_qlora.yaml,sha256=_zpbLWk5Dzc1rt1hKwiFgxPi_34rstQjqnefZzJKJdw,7297
recipes/training/dpo/llama3_3B_s3_file.yaml,sha256=klC5YPKErBBktXwJPJ3Upa29DHwuqx65cNsMxnksWK0,6773
recipes/training/grpo/llama3_3B_full.yaml,sha256=nyyfon5LkugN_OuXFVTmCNT_9yfim4eEmu01SK6DDlY,6294
recipes/training/grpo/llama3_3B_local_file.yaml,sha256=zKgFG9QDjoKEFxSY4XeD5i9cHs4Cw2kzzLjJKScLjFQ,6492
recipes/training/grpo/llama3_3B_lora.yaml,sha256=oRXAqlc_iV0rdPsp5P9rC3D8F9C9dSfCxd3NZ-EA2q4,6897
recipes/training/grpo/llama3_3B_s3_file.yaml,sha256=H_shgXhdHqf95RqNtovW2rPleEXnCgtmm5gFfbEznME,6720
recipes/training/gspo/llama3_3B_full.yaml,sha256=72Jhs89QnAds9SWFNu1q0wrfefrn1fOhe_3D68tgVt0,6908
recipes/training/gspo/llama3_3B_local_file.yaml,sha256=2H8-QO-eO-Dg1tN8Hryuh0oczPWDLFPFlpPSafVJZ0Y,7001
recipes/training/gspo/llama3_3B_lora.yaml,sha256=ffTZNo_cyiNFDq7FXQK6F5lvlun5Ri96EXXCTbh489E,7579
recipes/training/gspo/llama3_3B_s3_file.yaml,sha256=PLTN5Eh4WJN-QvPPzlH68t5taQOZgOcaxBj8_qn-KjM,7229
recipes/training/ppo/llama3_3B_full.yaml,sha256=gwPnmcFhOZcHa5EIvJ2pu17dZz2__g0ft_T1V7Lb60c,5719
recipes/training/ppo/llama3_3B_lora.yaml,sha256=R84-ylI4PAm89pN0KcrTNnqeEFeDvfGCNQpHEoKPpeU,6394
recipes/training/ppo/llama3_3B_qlora.yaml,sha256=iLKWN4J_351wNhAAx1UZs2XAhdPW4WTEMTdnlbx7-6M,6760
recipes/training/sft/llama3_3B_full.yaml,sha256=PBzqvPkFrZbP8joNXWofENtzC5cEYWyGXRyciN-ga8g,6232
recipes/training/sft/llama3_3B_local_file.yaml,sha256=osy_035XO-nUgB_79LDI0_uACxprOt6twmx5Qs0SUT8,6107
recipes/training/sft/llama3_3B_lora.yaml,sha256=8uc1tIQXe4NzuNc3ipi20xKrCgSCzYmzB_DQo_T3dkA,6827
recipes/training/sft/llama3_3B_qlora.yaml,sha256=N3yj9C81vzZ77oxwGFO5t1-gGyGvMJKTsviCyvJ5vUo,7192
recipes/training/sft/llama3_3B_s3_file.yaml,sha256=GARkBa3wgIJmvLNPW6GlXf404CDSAA_NKuB8OHx8mnw,2282
recipes/training/sft/llama3_3B_s3_model.yaml,sha256=2FOMOHpVOlYxhxJaq0DvgDdeN8O3gJQVZz133rdX8Bs,2387
trainers/README.md,sha256=Ls_NWCDwcB52Yb--RcWPPSJZFze8rkNRx4by5s3ygCk,10169
trainers/__init__.py,sha256=4-J2h1APE3LHEJNDAg-ikNgN64LC7MHcHIauw7L7w4M,323
trainers/cpt_trainer.py,sha256=YS6APEOEckPzu5CmRqwUTvrUcI-CAxjgJab3QFFckEM,6874
trainers/dpo_trainer.py,sha256=rgR2S8SN_L_DFvM41E8InSpIBrMbPEi3AMCnImTTMR0,9723
trainers/grpo_trainer.py,sha256=789kx9Xg4BhtR0ptRm6_r3WIyeXCpIfd30zOasBhpWo,10582
trainers/gspo_trainer.py,sha256=ZHSBoCwjzjteLg4UoeKE4JCsLgNsk6dn-qHNz_O9ZfE,10988
trainers/sft_trainer.py,sha256=GEamCg4KSQBw87gV1hHkcGL6U76hlPLjpvMSqeAlHgk,8241
trainers/train.py,sha256=D24Br42r5xxAqPUAYZ5DD2Gy9mJFB7JmR8-O8GjKuhY,17248
trainers/rewards/__init__.py,sha256=1n7-T_HVBsCUh6g3VSA9kbkYZtKOxP4xcZtZN7lKS_k,138
trainers/rewards/accuracy_rewards.py,sha256=_UaSi9AO3YU7F7ElQDHjwGRPtSyzWgkV1Jy2wpObvAg,2012
trainers/rewards/custom_rewards.py,sha256=wU5kdglfVwSLh-yQYZMaOqjzzRuZ2oToAuz4n-U2l6w,1815
trainers/rewards/format_rewards.py,sha256=9yyMqLll0-1Koh1hCdsu33RtQ3jO3QaQeTQrRJHuSMk,684
trainers/templates/__init__.py,sha256=LjHvIpd2MlC5KXj-ytZeGlB6RKBdxse-SmNs5KX9Kto,210
trainers/templates/gsm8k_template.py,sha256=QE4ztuGHCkcxfFpRtF0laEfkqVeexT3R9594TIWmhRM,1568
trainers/templates/openmathinstruct_template.py,sha256=A09p8_pqJ1ncdFoj377bF37v9IsN-wUj31gorP8Mda0,1410
utils/__init__.py,sha256=Lfu5757fBA3Pqy2G8QGbSG090Lp_E09vb26iha4049s,1515
utils/api_utils.py,sha256=f1p9ucSc-r70Cs3g8KULL7cBXIRKcnEHHi5wDeGKK_s,12581
utils/config_validation.py,sha256=Lxy_8jZY0OyMI1rv8Xk3Kka6TCr16gSzW318dh3WTqg,1751
utils/dataset_utils.py,sha256=ka5ALIry7Xma0Hli8P3nNCbwUtQdoNU5OAos1xLDq7U,3568
utils/device_utils.py,sha256=dmgSHXgvasnFMQUN8y1MAvVI24eyJDUnNMCmAWFtpkE,16355
utils/hosted_llm_config.py,sha256=vBbPrFyWTy8VKKmb67DU3xZ0pTrqF6O5fcPCMnfjFQ8,8598
utils/logging_utils.py,sha256=77OILPp7ZY7dQZGc-O8Yt0yMgNm1cCQMf5Rjy9hA1Tg,10783
utils/recipe_overrides.py,sha256=iJfaWxv4f95EVacXTRmSk4jFCjxrzd-A7dCmZRAaWME,2642
utils/s3_utils.py,sha256=-ROIBDxg6uL8msnii7wuzMXDf4qSclPEqWNnqmjYNVE,11945
fai_rl-0.1.27.dist-info/METADATA,sha256=adOu2iDXwKohNbUVN7-s3azj75aJs7hM4JAg14PVos8,18118
fai_rl-0.1.27.dist-info/WHEEL,sha256=aeYiig01lYGDzBgS8HxWXOg3uV61G9ijOsup-k9o1sk,91
fai_rl-0.1.27.dist-info/entry_points.txt,sha256=R0R4WJEzjAbhyaGoW7rHQg0YuAP918a-lBO9wIvnMPU,133
fai_rl-0.1.27.dist-info/top_level.txt,sha256=ghtp5nKBSyHK93kCqsJ-no05ExxWZcxXsaKlB5i7Ml8,58
fai_rl-0.1.27.dist-info/RECORD,,
