# NOTE(review): stray "Newer" / "Older" page-navigation labels were here; they are not part of this module.
# This file may not be shared/redistributed without permission. Please read copyright notice in the git repo. If this file contains other copyright notices disregard this text.
from irlc.pacman.pacman_environment import PacmanEnvironment
from irlc.ex01.agent import train
from irlc.ex01.agent import Agent
from irlc import interactive
from irlc.lectures.chapter3dp.dp_pacman import SS1tiny
def ppac(layout_str, name="pac"):
    """Run a short Pacman session through ``interactive`` and print the rewards.

    Builds a ``PacmanEnvironment`` from ``layout_str``, pairs it with a base
    ``Agent``, passes both through ``interactive`` and then calls ``train``
    with ``num_episodes=5`` and ``max_steps=8``. The ``'Accumulated Reward'``
    entry of every returned stats record is printed as a list.

    Args:
        layout_str: Layout description forwarded as ``layout_str`` to
            ``PacmanEnvironment`` (``layout`` itself is passed as ``None``).
        name: Not used by this function; kept so existing callers that pass
            it keep working.
    """
    env = PacmanEnvironment(layout=None, layout_str=layout_str, animate_movement=True)
    try:
        agent = Agent(env)
        # ``interactive`` hands back the (env, agent) pair used from here on.
        # NOTE(review): presumably this supersedes the older PlayWrapper /
        # VideoMonitor wrapping that used to be done by hand here -- confirm.
        env, agent = interactive(env, agent)
        stats, _ = train(env, agent, num_episodes=5, max_steps=8)
        print("Accumulated reward for all episodes:", [s['Accumulated Reward'] for s in stats])
    finally:
        # Close whichever environment is current, even when wrapping or
        # training raised, so it is not left open on error.
        env.close()
if __name__ == "__main__":
    # Script entry point: run the demo on the imported SS1tiny layout.
    ppac(layout_str=SS1tiny)