First Push

Browse files

Files changed (4) hide show

config.json +1 -1
configuration.yaml +2 -0
run_logs/timers.json +20 -350
run_logs/training_status.json +2 -60

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -50,6 +50,7 @@ env_settings:
   base_port: 5005
   num_envs: 1
   num_areas: 1
   seed: -1
   max_lifetime_restarts: 10
   restarts_rate_limit_n: 1
@@ -62,6 +63,7 @@ engine_settings:
   target_frame_rate: -1
   capture_frame_rate: 60
   no_graphics: true
 environment_parameters: null
 checkpoint_settings:
   run_id: SnowballTarget1

   base_port: 5005
   num_envs: 1
   num_areas: 1
+  timeout_wait: 60
   seed: -1
   max_lifetime_restarts: 10
   restarts_rate_limit_n: 1
   target_frame_rate: -1
   capture_frame_rate: 60
   no_graphics: true
+  no_graphics_monitor: false
 environment_parameters: null
 checkpoint_settings:
   run_id: SnowballTarget1

run_logs/timers.json CHANGED Viewed

@@ -1,375 +1,45 @@
 {
     "name": "root",
-    "gauges": {
-        "SnowballTarget.Policy.Entropy.mean": {
-            "value": 0.9262873530387878,
-            "min": 0.9239082932472229,
-            "max": 2.8697240352630615,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Entropy.sum": {
-            "value": 8884.9482421875,
-            "min": 8884.9482421875,
-            "max": 29451.978515625,
-            "count": 20
-        },
-        "SnowballTarget.Step.mean": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
-        },
-        "SnowballTarget.Step.sum": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 12.910005569458008,
-            "min": 0.338864266872406,
-            "max": 12.910005569458008,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2517.451171875,
-            "min": 65.73966979980469,
-            "max": 2606.02783203125,
-            "count": 20
-        },
-        "SnowballTarget.Environment.EpisodeLength.mean": {
-            "value": 199.0,
-            "min": 199.0,
-            "max": 199.0,
-            "count": 20
-        },
-        "SnowballTarget.Environment.EpisodeLength.sum": {
-            "value": 10945.0,
-            "min": 8756.0,
-            "max": 10945.0,
-            "count": 20
-        },
-        "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.06521946081763827,
-            "min": 0.06160413643031942,
-            "max": 0.07541242198898294,
-            "count": 20
-        },
-        "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.2608778432705531,
-            "min": 0.2464165457212777,
-            "max": 0.3657878658222947,
-            "count": 20
-        },
-        "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.21077231748723516,
-            "min": 0.10733545933252053,
-            "max": 0.27753121256828306,
-            "count": 20
-        },
-        "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.8430892699489406,
-            "min": 0.42934183733008213,
-            "max": 1.3876560628414154,
-            "count": 20
-        },
-        "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 8.082097306000005e-06,
-            "min": 8.082097306000005e-06,
-            "max": 0.000291882002706,
-            "count": 20
-        },
-        "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 3.232838922400002e-05,
-            "min": 3.232838922400002e-05,
-            "max": 0.00138516003828,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.10269400000000001,
-            "min": 0.10269400000000001,
-            "max": 0.19729400000000002,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.41077600000000003,
-            "min": 0.41077600000000003,
-            "max": 0.96172,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Beta.mean": {
-            "value": 0.0001444306000000001,
-            "min": 0.0001444306000000001,
-            "max": 0.0048649706,
-            "count": 20
-        },
-        "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.0005777224000000004,
-            "min": 0.0005777224000000004,
-            "max": 0.023089828,
-            "count": 20
-        },
-        "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 25.863636363636363,
-            "min": 3.090909090909091,
-            "max": 25.863636363636363,
-            "count": 20
-        },
-        "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1138.0,
-            "min": 136.0,
-            "max": 1380.0,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 25.863636363636363,
-            "min": 3.090909090909091,
-            "max": 25.863636363636363,
-            "count": 20
-        },
-        "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1138.0,
-            "min": 136.0,
-            "max": 1380.0,
-            "count": 20
-        },
-        "SnowballTarget.IsTraining.mean": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 20
-        },
-        "SnowballTarget.IsTraining.sum": {
-            "value": 1.0,
-            "min": 1.0,
-            "max": 1.0,
-            "count": 20
-        }
-    },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1690710094",
-        "python_version": "3.10.6 (main, May 29 2023, 11:10:38) [GCC 11.3.0]",
-        "command_line_arguments": "/home/darth/MLAI-projects/unity_ML_env_rl/envunity/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
-        "mlagents_version": "0.31.0.dev0",
-        "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
-        "pytorch_version": "1.11.0+cu102",
-        "numpy_version": "1.21.2",
-        "end_time_seconds": "1690710395"
     },
-    "total": 301.2973983959964,
     "count": 1,
-    "self": 0.24279949300398584,
     "children": {
         "run_training.setup": {
-            "total": 0.012102430991944857,
             "count": 1,
-            "self": 0.012102430991944857
         },
         "TrainerController.start_learning": {
-            "total": 301.0424964720005,
             "count": 1,
-            "self": 0.4472816170891747,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 4.1457579050038476,
                     "count": 1,
-                    "self": 4.1457579050038476
-                },
-                "TrainerController.advance": {
-                    "total": 296.32677600091847,
-                    "count": 18205,
-                    "self": 0.21726975301862694,
-                    "children": {
-                        "env_step": {
-                            "total": 296.10950624789984,
-                            "count": 18205,
-                            "self": 210.70691560591513,
-                            "children": {
-                                "SubprocessEnvManager._take_step": {
-                                    "total": 85.17109143872221,
-                                    "count": 18205,
-                                    "self": 1.0946911648643436,
-                                    "children": {
-                                        "TorchPolicy.evaluate": {
-                                            "total": 84.07640027385787,
-                                            "count": 18205,
-                                            "self": 84.07640027385787
-                                        }
-                                    }
-                                },
-                                "workers": {
-                                    "total": 0.2314992032625014,
-                                    "count": 18205,
-                                    "self": 0.0,
-                                    "children": {
-                                        "worker_root": {
-                                            "total": 300.3939307623077,
-                                            "count": 18205,
-                                            "is_parallel": true,
-                                            "self": 167.06463586754398,
-                                            "children": {
-                                                "run_training.setup": {
-                                                    "total": 0.0,
-                                                    "count": 0,
-                                                    "is_parallel": true,
-                                                    "self": 0.0,
-                                                    "children": {
-                                                        "steps_from_proto": {
-                                                            "total": 0.001692421006737277,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.0004321349988458678,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.001260286007891409,
-                                                                    "count": 10,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.001260286007891409
-                                                                }
-                                                            }
-                                                        },
-                                                        "UnityEnvironment.step": {
-                                                            "total": 0.021032813005149364,
-                                                            "count": 1,
-                                                            "is_parallel": true,
-                                                            "self": 0.0003260369994677603,
-                                                            "children": {
-                                                                "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00021892199583817273,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.00021892199583817273
-                                                                },
-                                                                "communicator.exchange": {
-                                                                    "total": 0.01946014900750015,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.01946014900750015
-                                                                },
-                                                                "steps_from_proto": {
-                                                                    "total": 0.001027705002343282,
-                                                                    "count": 1,
-                                                                    "is_parallel": true,
-                                                                    "self": 0.00022556701151188463,
-                                                                    "children": {
-                                                                        "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0008021379908313975,
-                                                                            "count": 10,
-                                                                            "is_parallel": true,
-                                                                            "self": 0.0008021379908313975
-                                                                        }
-                                                                    }
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                },
-                                                "UnityEnvironment.step": {
-                                                    "total": 133.32929489476373,
-                                                    "count": 18204,
-                                                    "is_parallel": true,
-                                                    "self": 5.69056420630659,
-                                                    "children": {
-                                                        "UnityEnvironment._generate_step_input": {
-                                                            "total": 3.2870714761229465,
-                                                            "count": 18204,
-                                                            "is_parallel": true,
-                                                            "self": 3.2870714761229465
-                                                        },
-                                                        "communicator.exchange": {
-                                                            "total": 105.69360468778177,
-                                                            "count": 18204,
-                                                            "is_parallel": true,
-                                                            "self": 105.69360468778177
-                                                        },
-                                                        "steps_from_proto": {
-                                                            "total": 18.658054524552426,
-                                                            "count": 18204,
-                                                            "is_parallel": true,
-                                                            "self": 3.9579579753481084,
-                                                            "children": {
-                                                                "_process_rank_one_or_two_observation": {
-                                                                    "total": 14.700096549204318,
-                                                                    "count": 182040,
-                                                                    "is_parallel": true,
-                                                                    "self": 14.700096549204318
-                                                                }
-                                                            }
-                                                        }
-                                                    }
-                                                }
-                                            }
-                                        }
-                                    }
-                                }
-                            }
-                        }
-                    }
                 },
                 "trainer_threads": {
-                    "total": 0.00011076898954343051,
                     "count": 1,
-                    "self": 0.00011076898954343051,
-                    "children": {
-                        "thread_root": {
-                            "total": 0.0,
-                            "count": 0,
-                            "is_parallel": true,
-                            "self": 0.0,
-                            "children": {
-                                "trainer_advance": {
-                                    "total": 295.70782078724005,
-                                    "count": 220402,
-                                    "is_parallel": true,
-                                    "self": 2.8024480845488142,
-                                    "children": {
-                                        "process_trajectory": {
-                                            "total": 158.59546039077395,
-                                            "count": 220402,
-                                            "is_parallel": true,
-                                            "self": 157.94113994776853,
-                                            "children": {
-                                                "RLTrainer._checkpoint": {
-                                                    "total": 0.6543204430054175,
-                                                    "count": 4,
-                                                    "is_parallel": true,
-                                                    "self": 0.6543204430054175
-                                                }
-                                            }
-                                        },
-                                        "_update_policy": {
-                                            "total": 134.3099123119173,
-                                            "count": 90,
-                                            "is_parallel": true,
-                                            "self": 40.4545891147136,
-                                            "children": {
-                                                "TorchPPOOptimizer.update": {
-                                                    "total": 93.85532319720369,
-                                                    "count": 4587,
-                                                    "is_parallel": true,
-                                                    "self": 93.85532319720369
-                                                }
-                                            }
-                                        }
-                                    }
-                                }
-                            }
-                        }
-                    }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.12257017999945674,
                     "count": 1,
-                    "self": 0.0008117520046653226,
-                    "children": {
-                        "RLTrainer._checkpoint": {
-                            "total": 0.12175842799479142,
-                            "count": 1,
-                            "self": 0.12175842799479142
-                        }
-                    }
                 }
             }
         }

 {
     "name": "root",
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1705041622",
+        "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
+        "mlagents_version": "1.1.0.dev0",
+        "mlagents_envs_version": "1.1.0.dev0",
         "communication_protocol_version": "1.5.0",
+        "pytorch_version": "2.1.2+cu121",
+        "numpy_version": "1.23.5",
+        "end_time_seconds": "1705041623"
     },
+    "total": 0.2293522939999093,
     "count": 1,
+    "self": 0.017557923999902414,
     "children": {
         "run_training.setup": {
+            "total": 0.06224575999999615,
             "count": 1,
+            "self": 0.06224575999999615
         },
         "TrainerController.start_learning": {
+            "total": 0.14954861000001074,
             "count": 1,
+            "self": 0.0004441789999418688,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 0.1490876269999717,
                     "count": 1,
+                    "self": 0.1490876269999717
                 },
                 "trainer_threads": {
+                    "total": 1.5450000319106039e-06,
                     "count": 1,
+                    "self": 1.5450000319106039e-06
                 },
                 "TrainerController._save_models": {
+                    "total": 1.525900006527081e-05,
                     "count": 1,
+                    "self": 1.525900006527081e-05
                 }
             }
         }

run_logs/training_status.json CHANGED Viewed

@@ -1,65 +1,7 @@
 {
-    "SnowballTarget": {
-        "checkpoints": [
-            {
-                "steps": 49936,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 11.181818181818182,
-                "creation_time": 1690710173.516804,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
-                ]
-            },
-            {
-                "steps": 99960,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 22.272727272727273,
-                "creation_time": 1690710247.6696513,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
-                ]
-            },
-            {
-                "steps": 149984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 23.454545454545453,
-                "creation_time": 1690710321.9218476,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
-                ]
-            },
-            {
-                "steps": 199984,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": 25.727272727272727,
-                "creation_time": 1690710395.0971208,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
-                ]
-            },
-            {
-                "steps": 200112,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
-                "reward": 25.727272727272727,
-                "creation_time": 1690710395.2414272,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
-                ]
-            }
-        ],
-        "final_checkpoint": {
-            "steps": 200112,
-            "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 25.727272727272727,
-            "creation_time": 1690710395.2414272,
-            "auxillary_file_paths": [
-                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
-            ]
-        }
-    },
     "metadata": {
         "stats_format_version": "0.3.0",
-        "mlagents_version": "0.31.0.dev0",
-        "torch_version": "1.11.0+cu102"
     }
 }

 {
     "metadata": {
         "stats_format_version": "0.3.0",
+        "mlagents_version": "1.1.0.dev0",
+        "torch_version": "2.1.2+cu121"
     }
 }