LICENSE
MANIFEST.in
README.md
setup.py
mavrl/__init__.py
mavrl/learned_reward_wrapper.py
mavrl/losses.py
mavrl/multi_fb_model.py
mavrl/priors.py
mavrl/true_reward_callback.py
mavrl/types.py
mavrl.egg-info/PKG-INFO
mavrl.egg-info/SOURCES.txt
mavrl.egg-info/dependency_links.txt
mavrl.egg-info/requires.txt
mavrl.egg-info/top_level.txt
mavrl/active_learning/__init__.py
mavrl/active_learning/human_simulator.py
mavrl/active_learning/information_gain.py
mavrl/active_learning/online_learner.py
mavrl/active_learning/query_generator.py
mavrl_experiments/__init__.py
mavrl_experiments/cli.py
mavrl_experiments/config.py
mavrl_experiments/config_loader.py
mavrl_experiments/equal_budget_table.py
mavrl_experiments/evaluation_worker.py
mavrl_experiments/file_queue.py
mavrl_experiments/fixed_allocation_table.py
mavrl_experiments/fixed_allocation_watch.py
mavrl_experiments/online_worker.py
mavrl_experiments/optuna_budget_table.py
mavrl_experiments/optuna_budget_watch.py
mavrl_experiments/optuna_propagate.py
mavrl_experiments/optuna_search.py
mavrl_experiments/select_best.py
mavrl_experiments/table.py
mavrl_experiments/utils.py
mavrl_experiments/visualize.py
mavrl_experiments/worker.py
mavrl_experiments/configs/experiments/eval_grid_cliff_baseline.py
mavrl_experiments/configs/experiments/eval_grid_sparse_baseline.py
mavrl_experiments/configs/experiments/eval_grid_trap_baseline.py
mavrl_experiments/configs/experiments/eval_lander_baseline.py
mavrl_experiments/configs/experiments/online_al_grid_trap.py
mavrl_experiments/configs/experiments/rb_prefs-demos-ratings_08-01-2026.py
mavrl_experiments/configs/experiments/rb_prefs-demos_07-01-2026.py
mavrl_experiments/configs/experiments/sweep_acrobot.py
mavrl_experiments/configs/experiments/sweep_acrobot_full.py
mavrl_experiments/configs/experiments/sweep_cartpole.py
mavrl_experiments/configs/experiments/sweep_cartpole_full.py
mavrl_experiments/configs/experiments/sweep_grid_cliff.py
mavrl_experiments/configs/experiments/sweep_grid_cliff_full.py
mavrl_experiments/configs/experiments/sweep_grid_sparse.py
mavrl_experiments/configs/experiments/sweep_grid_sparse_full.py
mavrl_experiments/configs/experiments/sweep_grid_trap.py
mavrl_experiments/configs/experiments/sweep_grid_trap_demo_misspec.py
mavrl_experiments/configs/experiments/sweep_grid_trap_full.py
mavrl_experiments/configs/experiments/sweep_grid_trap_mavrl_misspec.py
mavrl_experiments/configs/experiments/sweep_grid_trap_pref_misspec.py
mavrl_experiments/configs/experiments/sweep_grid_trap_rating_misspec.py
mavrl_experiments/configs/experiments/sweep_grid_trap_stop_misspec.py
mavrl_experiments/configs/experiments/sweep_lander.py
mavrl_experiments/configs/experiments/sweep_lander_full.py
mavrl_experiments/configs/experiments/transfer_acrobot.py
mavrl_experiments/configs/experiments/transfer_acrobot_tiny.py
mavrl_experiments/configs/experiments/transfer_grid_cliff.py
mavrl_experiments/configs/experiments/transfer_grid_trap.py
mavrl_experiments/configs/experiments/transfer_lander.py
mavrl_experiments/configs/experiments/ym_halfcheetah.py
mavrl_experiments/configs/optuna/acrobot_v1.py
mavrl_experiments/configs/optuna/acrobot_v1_fixed.py
mavrl_experiments/configs/optuna/acrobot_v1_fixed_paper.py
mavrl_experiments/configs/optuna/cartpole_v1.py
mavrl_experiments/configs/optuna/cartpole_v1_fixed.py
mavrl_experiments/configs/optuna/cartpole_v1_fixed_paper.py
mavrl_experiments/configs/optuna/grid_cliff.py
mavrl_experiments/configs/optuna/grid_cliff_fixed.py
mavrl_experiments/configs/optuna/grid_cliff_fixed_paper.py
mavrl_experiments/configs/optuna/grid_sparse.py
mavrl_experiments/configs/optuna/grid_sparse_fixed.py
mavrl_experiments/configs/optuna/grid_sparse_fixed_paper.py
mavrl_experiments/configs/optuna/grid_trap.py
mavrl_experiments/configs/optuna/grid_trap_fixed.py
mavrl_experiments/configs/optuna/grid_trap_fixed_paper.py
mavrl_experiments/configs/optuna/lunar_lander_v3.py
mavrl_experiments/configs/optuna/lunar_lander_v3_fixed.py
mavrl_experiments/configs/optuna/lunar_lander_v3_fixed_paper.py
tests/__init__.py
tests/test_cache_e2e.py
tests/test_datasets.py
tests/test_demo_nll.py
tests/test_epic.py
tests/test_human_simulator.py
tests/test_pref_nll.py
tests/test_rating_nll.py
tests/test_simulate_response.py
tests/test_stop_helpers.py
tests/repro/__init__.py
tests/repro/_repro_helpers.py
tests/repro/conftest.py
tests/repro/repro_diff.py
tests/repro/test_repro_datasets.py
tests/repro/test_repro_e2e_lunarlander.py
tests/repro/test_repro_e2e_tabular.py
tests/repro/test_repro_model_init.py
tests/repro/test_repro_ppo.py
tests/repro/test_repro_primitives.py
tests/repro/test_repro_train_step.py
tests/repro/test_repro_validation.py