Remove dropout at evaluation time on GPI-LS (#90)

LucasAlegre · Jan 25, 2024 · 9afcb3a
1 parent 6688e0f
commit 9afcb3a
Showing 1 changed file with 4 additions and 0 deletions.
diff --git a/morl_baselines/multi_policy/gpi_pd/gpi_pd.py b/morl_baselines/multi_policy/gpi_pd/gpi_pd.py
@@ -588,10 +588,14 @@ def eval(self, obs: np.ndarray, w: np.ndarray) -> int:
         """Select an action for the given obs and weight vector."""
         obs = th.as_tensor(obs).float().to(self.device)
         w = th.as_tensor(w).float().to(self.device)
+        for q_net in self.q_nets:
+            q_net.eval()
         if self.use_gpi:
             action = self.gpi_action(obs, w, include_w=False)
         else:
             action = self.max_action(obs, w)
+        for q_net in self.q_nets:
+            q_net.train()
         return action
 
     def _act(self, obs: th.Tensor, w: th.Tensor) -> int: