From ed2750ebc906fed622241279a9aca17baae5f080 Mon Sep 17 00:00:00 2001 From: Tue Herlau <tuhe@dtu.dk> Date: Thu, 1 May 2025 12:41:56 +0200 Subject: [PATCH] Not so secret agents for some of the in-class demos --- irlc/gridworld/demo_agents/hidden_agents.py | 9 +++++++++ 1 file changed, 9 insertions(+) diff --git a/irlc/gridworld/demo_agents/hidden_agents.py b/irlc/gridworld/demo_agents/hidden_agents.py index d831b11..6414662 100644 --- a/irlc/gridworld/demo_agents/hidden_agents.py +++ b/irlc/gridworld/demo_agents/hidden_agents.py @@ -63,6 +63,10 @@ class PolicyEvaluationAgent2(TabularAgent): self.policy[s][a] = 1/len(mdp.A(s)) super().__init__(env, gamma) + def reset(self): + self.v = defaultdict(lambda: 0) + + def pi(self, s,k, info=None): # TODO: 1 lines missing. @@ -162,6 +166,11 @@ class ValueIterationAgent3(TabularAgent): self.policy[s][a] = 1/len(mdp.A(s)) super().__init__(env, gamma, epsilon=epsilon) + def reset(self): + self.v = defaultdict(lambda: 0) + self.Q.q_.clear() + + def pi(self, s,k, info=None): from irlc import Agent -- GitLab