Slide 57
Slide 57 text
This is a very very very long gag
PacMan Beispiel
@C_Keibel
# Training loop for the Ms. Pac-Man example: run x episodes, record every
# transition, and call replay() once more than min_size transitions exist.
# get_action, save_transition, replay, transitions, min_size and x are not
# defined in this snippet and must be provided by the surrounding code.
env = gym.make("MsPacman-v0")  # plain ASCII quotes; typographic quotes do not parse
for _ in range(x):
    state = env.reset()
    episode_reward = 0
    # Reset the termination flag for every episode; without this the first
    # episode hits an undefined name and later episodes would be skipped.
    done = False
    while not done:
        action = get_action(state)
        next_state, reward, done, _ = env.step(action)
        episode_reward += reward
        save_transition(state, action, reward, next_state)
        state = next_state
        # NOTE(review): the original indentation was lost; this check is
        # assumed to run after every step rather than once per episode - confirm.
        if len(transitions) > min_size:
            replay()