Updated grad clips

2023-12-10 06:55:07 +01:00 · 2023-12-10 06:55:07 +01:00 · 939a90dd0f
commit 939a90dd0f
parent 85c1532920
10 changed files with 4 additions and 2 deletions
--- a/agents/.DS_Store
+++ b/agents/.DS_Store
--- a/agents/ppo/agent.py
+++ b/agents/ppo/agent.py
@@ -104,14 +104,16 @@ class Agent:
                T.nn.utils.clip_grad_norm_(
                    self.actor.parameters(), max_norm=2)
                T.nn.utils.clip_grad_norm_(
                    self.critic.parameters(), max_norm=2)
                # Calculate the gradient norms for both networks
                actor_grad_norm = T.nn.utils.clip_grad_norm_(
-                    self.actor.parameters(), max_norm=1)
+                    self.actor.parameters(), max_norm=2)
                critic_grad_norm = T.nn.utils.clip_grad_norm_(
-                    self.critic.parameters(), max_norm=1)
+                    self.critic.parameters(), max_norm=2)
                # Log or print the gradient norms
                print(f"Actor Gradient Norm: {actor_grad_norm}")
--- a/agents/saved_models/A0
+++ b/agents/saved_models/A0
--- a/agents/saved_models/C0
+++ b/agents/saved_models/C0
--- a/figures/older_figures/actor_loss.png
+++ b/figures/older_figures/actor_loss.png
--- a/figures/older_figures/critic_loss.png
+++ b/figures/older_figures/critic_loss.png
--- a/figures/older_figures/score.png
+++ b/figures/older_figures/score.png
--- a/figures/older_figures/total_loss.png
+++ b/figures/older_figures/total_loss.png
--- a/figures/score.png
+++ b/figures/score.png
--- a/figures/total_loss.png
+++ b/figures/total_loss.png