chirbard
/

ppo-Worm

@@ -32,4 +32,33 @@ tags:
   2. Step 1: Find your model_id: chirbard/ppo-Worm
   3. Step 2: Select your `*.nn` / `*.onnx` file
   4. Click on Watch the agent play 👀

   2. Step 1: Find your model_id: chirbard/ppo-Worm
   3. Step 2: Select your `*.nn` / `*.onnx` file
   4. Click on Watch the agent play 👀
+  ## Hyperparameters
+  ```yaml
+  behaviors:
+    Worm:
+      trainer_type: ppo
+      hyperparameters:
+        batch_size: 2024
+        buffer_size: 20240
+        learning_rate: 0.0003
+        beta: 0.005
+        epsilon: 0.2
+        lambd: 0.95
+        num_epoch: 3
+        learning_rate_schedule: linear
+      network_settings:
+        normalize: true
+        hidden_units: 512
+        num_layers: 3
+        vis_encode_type: simple
+      reward_signals:
+        extrinsic:
+          gamma: 0.9995
+          strength: 1.0
+      keep_checkpoints: 5
+      max_steps: 5000000
+      time_horizon: 1000
+      summary_freq: 30000
+  ```