# This file may not be shared/redistributed without permission. Please read copyright notice in the git repo. If this file contains other copyright notices disregard this text.
from irlc.pacman.pacman_environment import PacmanEnvironment
from irlc.ex01.agent import train
from irlc.ex01.agent import Agent
from irlc import interactive
from irlc.lectures.chapter3dp.dp_pacman import SS1tiny


def ppac(layout_str, name="pac"):
    """Run a short interactive Pacman session on the given layout.

    Builds a ``PacmanEnvironment`` from ``layout_str`` (with movement
    animation enabled), creates a base ``Agent`` for it, passes both through
    ``interactive`` and then trains for 5 episodes of at most 8 steps each.
    The accumulated reward of every episode is printed afterwards.

    Args:
        layout_str: Layout description forwarded to ``PacmanEnvironment`` as
            its ``layout_str`` argument.
        name: Currently unused; kept so existing callers that pass it keep
            working.
    """
    env = PacmanEnvironment(layout=None, layout_str=layout_str, animate_movement=True)
    try:
        agent = Agent(env)
        # ``interactive`` returns the (env, agent) pair that must be used from
        # here on, so both names are rebound.
        env, agent = interactive(env, agent)
        stats, _ = train(env, agent, num_episodes=5, max_steps=8)
        print("Accumulated reward for all episodes:", [s['Accumulated Reward'] for s in stats])
    finally:
        # Always release the environment, even if setup or training raises
        # or the user interrupts the session.
        env.close()


if __name__ == "__main__":
    ppac(SS1tiny)