rlai/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
rlai/core/__init__.py,sha256=SpYG0EnAciQWssm_souvyg3iDsgth_gKAn1tLvEerpg,41582
rlai/core/environments/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
rlai/core/environments/bandit.py,sha256=zlFSPDabV9J2BRO1a_r0o3tSi4UbLpc_fB9Eh30y1qw,6976
rlai/core/environments/gamblers_problem.py,sha256=ZVwOHmH7saKZSN4Prgjshos8CGcI6cZkEN0IiEmsFiA,4157
rlai/core/environments/gridworld.py,sha256=gMyLuB0n-sUQ6AdFFfa74cHCliUQRdA4Y1CsRCC8-vM,13407
rlai/core/environments/gymnasium.py,sha256=gKGILWdDYAL9EtRrNFBFhWGg3rGcKwOO-YIUUvfn2fA,63252
rlai/core/environments/mancala.py,sha256=oUODYP653xIvT1Blc2PjsEXGzgtjc0YayPRfFUt_2DI,14782
rlai/core/environments/mdp.py,sha256=MhxVUfc1VJiae0oPdLmI4twzuQbDQ0U8UW5-hZeWiuY,27232
rlai/core/environments/network.py,sha256=kSG0BmAfWOq8RyKDixLgpga_M7UTf2oI5_Zq1yJKWgM,7025
rlai/core/environments/robocode.py,sha256=12ac7-NtgPjI0WBdyaOsYiwc0QfNBJyZduNZiTij6uw,55089
rlai/core/environments/robocode_continuous_action.py,sha256=q72IKTUJud7Fwa7K_KikVX6C8HIpb3lEs-BXGvXjoYw,49336
rlai/docs.py,sha256=hgyfOG-2PtNLQdqGFywFA7yhtk9NkROhquLGtz0mCXo,7241
"rlai/figures/Epsilon-greedy with decreasing epsilon, bandit.pdf",sha256=X4N8pTBNdLiZM8i7eSgWcTThJSiDwlNpNa5yjAHTWKE,69585
"rlai/figures/Epsilon-greedy with recency-weighted reward average, nonstationary bandit.pdf",sha256=4jyhEtOTOual5wtp5__3JRKk2T61p9dCx_DxKvjUizg,70718
"rlai/figures/Epsilon-greedy, nonstationary bandit.pdf",sha256=dYQhpRaMR2wzQF95lg_VUlBjGrdC5XTJX6bNKa6MEXg,73402
"rlai/figures/Figure 2.2: Epsilon-greedy, bandit.pdf",sha256=2ku_ffPs_d22r3s463NAWego5PLS5NlAUqOzRgTATSg,70091
"rlai/figures/Figure 2.3:  Greedy with optimistic initial values and recency-weighted reward average, bandit.pdf",sha256=ncUsUNeizxUiMIRTszo5quFzL5kcYKUdHgCYFA9ECFE,34754
"rlai/figures/Figure 2.4:  Upper confidence bound, bandit.pdf",sha256=kEVPS2nHsFAa3ug0sb66dZ2d1oO22JIBuKvEwTSHwFc,53164
"rlai/figures/Figure 2.5:  Preference gradient no baseline, bandit.pdf",sha256=DgZmsNufc6xrmOKQPrQZn0JyI1IBkW3x9U5Wal4rM3o,33168
"rlai/figures/Figure 2.5:  Preference gradient, bandit.pdf",sha256=tnWf9fd2xCVqdTdjKF7_cXrl0IQcdG0vz_7uHs9OxMg,33473
rlai/figures/Mancala Learning.png,sha256=SmiSh1x42kqh3zeTrJhwCsrXVmPJnF5rDPZvIfabadE,51954
"rlai/figures/Quick run:  Epsilon-greedy, bandit.pdf",sha256=nYzPGfq8URR1Vj0UYvrn_JYOb4CgLTKYSeEhsNFgBcY,32853
rlai/gpi/__init__.py,sha256=fm-hv3PeUJtmTBfNATuwmF6VuJepyCyeMd5ftjWDyRM,384
rlai/gpi/dynamic_programming/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
rlai/gpi/dynamic_programming/evaluation.py,sha256=051M6N_ECX7r0sImgibBvvD_moTD3HUfptX9f5LdehM,9402
rlai/gpi/dynamic_programming/iteration.py,sha256=juZiEWJTPHGeUPzBsfsThl3Ty69yv8ea4OFcj7vjg4M,6488
rlai/gpi/monte_carlo/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
rlai/gpi/monte_carlo/evaluation.py,sha256=pSodCwTEOUfGqm8syiPmpCGblaVshuZqeNA9fDPAdQU,13411
rlai/gpi/monte_carlo/iteration.py,sha256=AsgFtBuTAqw10dTVv7dvQf_tMAyrQSoEfNV-uQgtOeU,8041
rlai/gpi/state_action_value/__init__.py,sha256=ztC9DNXkWxJ2wWoELWxjynEp7LWhrXOobsdgJKz91AQ,11117
rlai/gpi/state_action_value/function_approximation/__init__.py,sha256=wOVXQE6-GZkqjLSZG4u9PiQCKlrg9KsORjfRzeKfskE,24370
rlai/gpi/state_action_value/function_approximation/models/__init__.py,sha256=jNcQ1RsTrq_l1lYkO3hRQ9XOd8rV8dq2idPYdATTtMA,9003
rlai/gpi/state_action_value/function_approximation/models/feature_extraction.py,sha256=06X-YD9Z_fA4tr4sdOm0jTSKiGsd8-c8zui0dVPgCtM,8466
rlai/gpi/state_action_value/function_approximation/models/sklearn.py,sha256=segBoGS7y4BO73Kiz4ZTrBi0oqAjeEHyMNelUQKwtJE,7470
rlai/gpi/state_action_value/tabular.py,sha256=4-54BZ_njGOealQpLA73HqPwqMdh08TLk4RppDslXoM,22339
rlai/gpi/temporal_difference/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
rlai/gpi/temporal_difference/evaluation.py,sha256=T5oNhtuE3mXIgo7_j0uhy7nU3UmPD-NO5CbZh_Na2-o,19377
rlai/gpi/temporal_difference/iteration.py,sha256=evyuEtttgDb8cQeZZvbrtQu0Bz4rZIwTUBw3iwT8f8A,9381
rlai/gpi/utils.py,sha256=hLdVaiiTnkchoUn6sN-eELZH45yV37RA4rpMD4T7Fjo,9217
rlai/models/__init__.py,sha256=OvvltIS70vhA9XqluEdTEevA0Hk-HmSk29zfIW4B30M,2587
rlai/models/feature_extraction.py,sha256=ZqqEzHt0HzDbD6fehqw6nMNC6ipPD3bjRrNEpU_uDKM,16657
rlai/models/sklearn.py,sha256=Chix9hJpECfVviCJcXmhRThEQrP3KAIjR4wL0StYGJ0,21476
rlai/plot_utils.py,sha256=5nbtS4jhxqzaVBAX6PJQcMiLFOxct10VYUfOFKyA3T0,6732
rlai/policy_gradient/__init__.py,sha256=Lx5EGAMGhlGceEIpIJlWh83qjmPp_4zsHCnNiHFdzcU,3915
rlai/policy_gradient/monte_carlo/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
rlai/policy_gradient/monte_carlo/reinforce.py,sha256=mNLWrsixz34W6IwXfCX3RuJn5QDt3G3ZGi2LPgkSRiQ,39570
rlai/policy_gradient/policies/__init__.py,sha256=Y1QBRhBaDU_eq9BG2lYF2SlYl49l0A9rIzFwsQF3PZA,2396
rlai/policy_gradient/policies/continuous_action.py,sha256=5OD-bFWJIcu0i-dnyfR20E5qVEsvpGffewzF0VsSXmQ,37641
rlai/policy_gradient/policies/discrete_action.py,sha256=pgKXwatzZgX8YpE7fulASnYMLh1DHjrdbtxctkq2aqQ,15782
rlai/policy_gradient/utils.py,sha256=PYv-YI_qaLBDvEhMg99YlZSBIc6RHlJt9sQ98D30Smk,412
rlai/runners/__init__.py,sha256=47DEQpj8HBSa-_TImW-5JCeuQeRkm5NMpJWZG3hSuFU,0
rlai/runners/agent_in_environment.py,sha256=62ybGguP0rsqv4bFzntjdJPaZuwGbp0WnuktRVEmIwQ,7010
rlai/runners/top_level.py,sha256=jtT1yMbmv4AkBeu9VApMCWnpiobe2P-JCsHu3czhC7Y,1592
rlai/runners/trainer.py,sha256=AvyLp1E8fCQuSI6bWAwRxdziaYzrWkykpJ_NxkjTE2M,13647
rlai/state_value/__init__.py,sha256=RdRXyJfj3pHMRo1Pg6GZJS2Pam49jSj6PMiJVZCEGvs,3698
rlai/state_value/function_approximation/__init__.py,sha256=89MJxO4S2rndxD9Oq_tOaDURuMRbFkps0DKfX9YWQy0,10429
rlai/state_value/function_approximation/models/__init__.py,sha256=V5WxjiM6f6LJLYBb0HmUGwc85jePNZ_vR85RNU5He1c,1241
rlai/state_value/function_approximation/models/feature_extraction.py,sha256=peQAbl4bkHvBEyqnI7T-U68sXdSAf0Wl3Vhgj5Z2dew,9712
rlai/state_value/function_approximation/models/sklearn.py,sha256=noMYE14fenIdImKTfEF0s9d_G_Ywh3THvQCPOxLDuJw,4190
rlai/utils.py,sha256=l_TMdhEV2Ng9xdd3ufAnbAPHwl9ztKu-VvT1UTD5gpA,16859
rlai-1.6.0.dist-info/METADATA,sha256=L4PgCIPEEFC53dvv0q8JYhfOgyBZ5QpoS98HPaTgnLE,12064
rlai-1.6.0.dist-info/WHEEL,sha256=EGEvSphFYqXKs23-kQBeyNoJP1nrT8ZJKQoi5p5DYL8,88
rlai-1.6.0.dist-info/entry_points.txt,sha256=3r91xPzcjjSiL_5IWH_5jL1n_-c5pd1wjdQO2QNXXPg,51
rlai-1.6.0.dist-info/licenses/LICENSE,sha256=FF_9fiJxStFD9z5Oskliny-BX6dqSfOwEzpfF-INb-U,1071
rlai-1.6.0.dist-info/RECORD,,
