Stop zero initializing the SAC networks
This makes gradient descent super hard, and it fails to converge. The
default random initialization is much better.
Change-Id: I96465dad8313e5101a58365fee4458ffe7336442
Signed-off-by: Austin Schuh <austin.linux@gmail.com>
diff --git a/frc971/control_loops/swerve/velocity_controller/model.py b/frc971/control_loops/swerve/velocity_controller/model.py
index 0d8a410..1394463 100644
--- a/frc971/control_loops/swerve/velocity_controller/model.py
+++ b/frc971/control_loops/swerve/velocity_controller/model.py
@@ -113,7 +113,6 @@
mu = nn.Dense(
features=self.action_space,
name='mu',
- kernel_init=nn.initializers.zeros,
)(x)
log_std_layer = nn.Dense(features=self.action_space,
@@ -180,8 +179,10 @@
)(x)
x = self.activation(x)
- x = nn.Dense(name=f'q', features=1,
- kernel_init=nn.initializers.zeros)(x)
+ x = nn.Dense(
+ name=f'q',
+ features=1,
+ )(x)
return x