Skip to content

Commit

Permalink
added max_episode_steps to satisfy reward implementation
Browse files Browse the repository at this point in the history
  • Loading branch information
AlexanderManich committed Apr 15, 2024
1 parent 83089b4 commit 6fd0e11
Showing 1 changed file with 14 additions and 0 deletions.
14 changes: 14 additions & 0 deletions src/fastfiz_env/envs/velocity_fastfiz.py
Original file line number Diff line number Diff line change
Expand Up @@ -36,6 +36,17 @@ def __init__(
self.table_state = create_table_state(self.num_balls)
self.observation_space = self._observation_space()
self.action_space = self._action_space()
self.max_episode_steps = None

def _max_episode_steps(self):
    """Cache the episode step limit on the environment and on its reward.

    Looks up ``_time_limit_max_episode_steps`` through
    ``self.get_wrapper_attr``. When a non-``None`` value is found it is
    stored on ``self.max_episode_steps`` and copied to
    ``self.reward.max_episode_steps``. When the attribute is missing or
    ``None``, nothing is modified, so a later call can try again.

    NOTE(review): the attribute is presumably provided by a time-limit
    wrapper around this environment -- confirm where it is set.
    """
    try:
        # Look the value up once; a missing attribute is reported by
        # raising AttributeError rather than by returning None.
        limit = self.get_wrapper_attr("_time_limit_max_episode_steps")
    except AttributeError:
        # No step limit is exposed: keep the current state untouched
        # instead of failing the caller.
        return

    if limit is None:
        return

    self.max_episode_steps = limit
    # Keep the reward object in sync with the environment's limit.
    self.reward.max_episode_steps = limit

def reset(
self, *, seed: Optional[int] = None, options: Optional[dict] = None
Expand All @@ -45,6 +56,9 @@ def reset(
"""
super().reset(seed=seed)

if self.max_episode_steps is None:
self._max_episode_steps()

self.table_state = create_table_state(self.num_balls)
self.reward.reset(self.table_state)
observation = self._get_observation(self.table_state, [])
Expand Down

0 comments on commit 6fd0e11

Please sign in to comment.