diff --git a/simulation_ws/src/rl-agent/markov/environments/mars_env.py b/simulation_ws/src/rl-agent/markov/environments/mars_env.py index 1891868..7eb7d8e 100644 --- a/simulation_ws/src/rl-agent/markov/environments/mars_env.py +++ b/simulation_ws/src/rl-agent/markov/environments/mars_env.py @@ -478,9 +478,9 @@ def reward_function(self): # No Episode ending events - continue to calculate reward - general waypoints not helpful - """ # smooth reward with no waypoints + # smooth reward with no waypoints multiplier = 1 - (self.current_distance_to_checkpoint/INITIAL_DISTANCE_TO_CHECKPOINT)**4 - """ + """ progress = INITIAL_DISTANCE_TO_CHECKPOINT / self.current_distance_to_checkpoint