From eeb077fed1036483234986995bd328ece0eb2e08 Mon Sep 17 00:00:00 2001
From: Timothy Gregg <Timothy.Gregg@complete.tech>
Date: Mon, 4 Aug 2025 19:41:53 -0400
Subject: [PATCH] Avoid zero updates in scheduler

---
 agents/ppo_agent.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/agents/ppo_agent.py b/agents/ppo_agent.py
index 4d1f318..66c6087 100644
--- a/agents/ppo_agent.py
+++ b/agents/ppo_agent.py
@@ -135,6 +135,8 @@ def __init__(self, config, device):
 
         # Add learning rate scheduler for linear decay with minimum LR
         num_updates = config.total_timesteps // (config.n_steps * config.n_envs)
+        # Clamp to >= 1: short runs floor-divide to 0 and lr_lambda divides by num_updates
+        num_updates = max(num_updates, 1)
         min_lr_ratio = 0.1  # Don't let LR go below 10% of initial
         lr_lambda = lambda update: max(min_lr_ratio, 1.0 - (update / num_updates))
         self.scheduler = torch.optim.lr_scheduler.LambdaLR(self.optimizer, lr_lambda=lr_lambda)