diff --git a/webots/controllers/RL_Supervisor/agent.py b/webots/controllers/RL_Supervisor/agent.py
index 45769c8..82dafa9 100644
--- a/webots/controllers/RL_Supervisor/agent.py
+++ b/webots/controllers/RL_Supervisor/agent.py
@@ -108,7 +108,8 @@ def __init__(
         self.__chkpt_dir = chkpt_dir
         self.train_mode = False
         self.__top_speed = top_speed
-        self.__std_dev = 0.05
+        self.__std_dev = 0.05   # When training without an existing model this should be
+                                # set to 0.9 manually
         self.__memory = Memory(batch_size, max_buffer_length, gamma, gae_lambda)
         self.__neural_network = Models(actor_alpha, critic_alpha, self.__std_dev, policy_clip)
         self.__training_index = 0  # Track batch index during training