# Episode: iterable wrapper intended to bound how long an environment is run.
# Only the step budget is declared here; the usage sketch in this note constructs
# it as `Episode(env, maxsteps = 100)`, so a constructor (and presumably a
# reference to the env) is still to be added — TODO confirm.
# NOTE(review): `type` is pre-1.0 Julia syntax; the modern spelling is `mutable struct`.
type Episode
steps_remaining::Int
end
# TODO: iteration methods go here. Each iteration should decrement
# `steps_remaining` and return the current state.
# Usage sketch (pseudo-code): run an environment through an Episode iterator.
# `Env(....)` is a placeholder; the constructor arguments are elided in this note.
env = Env(....)
# Each iteration binds `state`; `maxsteps = 100` is passed to the Episode
# constructor (presumably it initializes `steps_remaining` — TODO confirm).
for state in Episode(env, maxsteps = 100)
# Pick an action here (selection logic not shown; `action` must be bound
# before the call below).
act(env, action)
end
Note: `Env` should store the next action to apply, so that the iterator can apply it (by calling `step`).
Something like:
Note: `Env` should store the next action to apply, so that the iterator can apply it (by calling `step`).