From 6d57d04100d5dac6ec499c566d2930acbfee93cf Mon Sep 17 00:00:00 2001 From: Matthew Gerber Date: Tue, 26 Dec 2023 13:28:38 -0500 Subject: [PATCH] Finish not fitting intercept if extractor provides one. --- run_configurations/CartPole train FA.run.xml | 3 +- .../MountainCar continuous train FA.run.xml | 2 +- src/rlai/core/environments/gridworld.py | 25 ++- src/rlai/core/environments/gymnasium.py | 181 ++++++++++++------ src/rlai/core/environments/robocode.py | 15 +- .../robocode_continuous_action.py | 15 +- .../function_approximation/__init__.py | 17 +- .../models/feature_extraction.py | 11 ++ .../function_approximation/models/sklearn.py | 23 ++- src/rlai/models/__init__.py | 4 +- src/rlai/models/feature_extraction.py | 30 ++- src/rlai/models/sklearn.py | 18 +- .../policies/continuous_action.py | 37 ++-- .../policies/discrete_action.py | 2 +- .../function_approximation/__init__.py | 17 +- src/rlai/utils.py | 2 +- ..._carlo_with_function_approximationo.pickle | Bin 5675 -> 5704 bytes test/rlai/gpi/monte_carlo/iteration_test.py | 2 +- ...i_function_approximation_no_formula.pickle | Bin 5676 -> 5704 bytes .../parameterized/continuous_action_test.py | 4 +- ...t_manual_versus_jax_policy_gradient.pickle | Bin 4443 -> 4023 bytes .../monte_carlo/fixtures/test_resume.pickle | Bin 81423 -> 19718 bytes ...st_continuous_action_discretization.pickle | Bin 22793 -> 25373 bytes .../test_gridworld_plot_model_pdf.pickle | Bin 6215 -> 6246 bytes ...gym_cartpole_function_approximation.pickle | Bin 694940 -> 695000 bytes ...e_function_approximation_plot_model.pickle | Bin 694941 -> 695001 bytes .../test_gym_continuous_mountain_car.pickle | Bin 107658 -> 11579 bytes ...adient_reinforce_beta_with_baseline.pickle | Bin 73080 -> 19684 bytes ...ient_reinforce_normal_with_baseline.pickle | Bin 69222 -> 18316 bytes ...ax_action_preferences_with_baseline.pickle | Bin 5755 -> 6171 bytes ...ction_interaction_feature_extractor.pickle | Bin 6213 -> 6245 bytes .../test_sarsa_with_model_plots.pickle | Bin 6216 -> 6247 bytes test/rlai/runners/monitor_test.py | 6 +- test/rlai/runners/trainer_test.py | 4 +- 34 files changed, 278 insertions(+), 140 deletions(-) diff --git a/run_configurations/CartPole train FA.run.xml b/run_configurations/CartPole train FA.run.xml index 2b2f3e26..68ba0c1c 100644 --- a/run_configurations/CartPole train FA.run.xml +++ b/run_configurations/CartPole train FA.run.xml @@ -1,6 +1,7 @@ +