ammr committed on Mar 5, 2023

Commit

efceb3b

1 Parent(s): 92f7f98

addsnowballtarget

Browse files

Files changed (18) hide show

SnowballTarget.onnx +1 -1
SnowballTarget/SnowballTarget-149984.onnx +1 -1
SnowballTarget/SnowballTarget-149984.pt +2 -2
SnowballTarget/SnowballTarget-199984.onnx +1 -1
SnowballTarget/SnowballTarget-199984.pt +2 -2
SnowballTarget/SnowballTarget-200112.onnx +1 -1
SnowballTarget/SnowballTarget-200112.pt +2 -2
SnowballTarget/SnowballTarget-49936.onnx +1 -1
SnowballTarget/SnowballTarget-49936.pt +2 -2
SnowballTarget/SnowballTarget-99960.onnx +1 -1
SnowballTarget/SnowballTarget-99960.pt +2 -2
SnowballTarget/checkpoint.pt +2 -2
SnowballTarget/{events.out.tfevents.1678034901.8cac745c4078.2553.0 → events.out.tfevents.1678035795.8cac745c4078.6559.0} +2 -2
config.json +1 -1
configuration.yaml +2 -2
run_logs/Player-0.log +14 -17
run_logs/timers.json +123 -123
run_logs/training_status.json +12 -12

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7688d35c2dc6fabec5fa481d56b6f4a4d4713593cd09e2979228a30555cc02fa
 size 645119

 version https://git-lfs.github.com/spec/v1
+oid sha256:a211d604995ede8e5eb3cb3dc9eca2fc377a51dc8c7a0bec2dac53dbde9ba7ea
 size 645119

SnowballTarget/SnowballTarget-149984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:54d10f6e4d97876a949f61936c87067e42e6dbcc3519e8923e0add06d781b87c
 size 645119

 version https://git-lfs.github.com/spec/v1
+oid sha256:76b03b4504c8ed32c0533476fa9f10339f51d93753a89ecec00350dbbb0ae94c
 size 645119

SnowballTarget/SnowballTarget-149984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1d16ba23efccce3105b9ae99fd14991d851e67afb031802a507a00e256233480
-size 3845585

 version https://git-lfs.github.com/spec/v1
+oid sha256:b6863ee3eb2886586a35d004afdadfe2e8f95d41a994016fac30da9a4c8b2303
+size 3845582

SnowballTarget/SnowballTarget-199984.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7688d35c2dc6fabec5fa481d56b6f4a4d4713593cd09e2979228a30555cc02fa
 size 645119

 version https://git-lfs.github.com/spec/v1
+oid sha256:a211d604995ede8e5eb3cb3dc9eca2fc377a51dc8c7a0bec2dac53dbde9ba7ea
 size 645119

SnowballTarget/SnowballTarget-199984.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:921e326b221b147dc85de42abbead1b3f03d7dd36e2c2aff25ac4ad430a33605
-size 3845585

 version https://git-lfs.github.com/spec/v1
+oid sha256:5fee661f793dde6360db1caf33a80112d384cc65fa399cdac6263bf126eed5e9
+size 3845582

SnowballTarget/SnowballTarget-200112.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7688d35c2dc6fabec5fa481d56b6f4a4d4713593cd09e2979228a30555cc02fa
 size 645119

 version https://git-lfs.github.com/spec/v1
+oid sha256:a211d604995ede8e5eb3cb3dc9eca2fc377a51dc8c7a0bec2dac53dbde9ba7ea
 size 645119

SnowballTarget/SnowballTarget-200112.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6e6f8fce3dae6b9d1dd3039c6b6c099e522368853231d080a37ff2fdd388de8e
-size 3845585

 version https://git-lfs.github.com/spec/v1
+oid sha256:c9ad410d79b14e251b5abbac09fcb4481d8f3b610854dbccaa6469f3d8157ece
+size 3845582

SnowballTarget/SnowballTarget-49936.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2a52d2705ada8fbcb9f2b2355542276b1bd047bab31eeeae793e4a63b4ba325d
 size 645119

 version https://git-lfs.github.com/spec/v1
+oid sha256:9ed1406acad3dda42b20ecfedd83635034b8bf20d4250df62f88912f36b30b0f
 size 645119

SnowballTarget/SnowballTarget-49936.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:191e78985f7b61cb795b71c0391ce9ae9add0efd582c111c5d716072d45c4a72
-size 3845585

 version https://git-lfs.github.com/spec/v1
+oid sha256:bf5eb4d22c768e920ebfcdef67356d281fdde2d3596dbbe42e2cfda20f2adbfe
+size 3845582

SnowballTarget/SnowballTarget-99960.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:078d8d4345a97fe7b6f043a3362303a15646741ea2469c5ca21c52d807ae5146
 size 645119

 version https://git-lfs.github.com/spec/v1
+oid sha256:3f0cced6ea41fcd181a20bdbcc43f2277106036f9664f7f2a88b928dcd800adb
 size 645119

SnowballTarget/SnowballTarget-99960.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7a4d297d3c2bb4955e09e74d8f0c90b44f9239fe456d4e1dcc86b154b85c79a0
-size 3845585

 version https://git-lfs.github.com/spec/v1
+oid sha256:cdf3fa39891ac28aa9860325dae393a45d4031e9a831f3357bac86d51d3329cb
+size 3845582

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6e6f8fce3dae6b9d1dd3039c6b6c099e522368853231d080a37ff2fdd388de8e
-size 3845585

 version https://git-lfs.github.com/spec/v1
+oid sha256:c9ad410d79b14e251b5abbac09fcb4481d8f3b610854dbccaa6469f3d8157ece
+size 3845582

SnowballTarget/{events.out.tfevents.1678034901.8cac745c4078.2553.0 → events.out.tfevents.1678035795.8cac745c4078.6559.0} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:84e21d3a97625d99e4366a384caa1cfde2fd7d6edb803a0954d5a71964ce5272
-size 39554

 version https://git-lfs.github.com/spec/v1
+oid sha256:433036b92a5b8a3bbfb9ee98dcd635b00d3f6a6cd8bb47de3c1823f6ca0a9843
+size 24633

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0001, "beta": 0.005, "epsilon": 0.1, "lambd": 0.95, "num_epoch": 3, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "checkpoint_interval": 50000, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0001, "beta": 0.005, "epsilon": 0.1, "lambd": 0.95, "num_epoch": 5, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "checkpoint_interval": 50000, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": true, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -9,7 +9,7 @@ behaviors:
       beta: 0.005
       epsilon: 0.1
       lambd: 0.95
-      num_epoch: 3
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
@@ -66,7 +66,7 @@ checkpoint_settings:
   initialize_from: null
   load_model: false
   resume: false
-  force: false
   train_model: false
   inference: false
   results_dir: results

       beta: 0.005
       epsilon: 0.1
       lambd: 0.95
+      num_epoch: 5
       learning_rate_schedule: linear
       beta_schedule: linear
       epsilon_schedule: linear
   initialize_from: null
   load_model: false
   resume: false
+  force: true
   train_model: false
   inference: false
   results_dir: results

run_logs/Player-0.log CHANGED Viewed

@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
-Unable to load player prefs
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2642:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.081 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.759932 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -53,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 5369 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -169,22 +166,22 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 41
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 6.8 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 17.7 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -213,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 3616 frames, [64.0 KB-128.0 KB]: 1845 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 67.3 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -231,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5461 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5460 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -249,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.082 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.642188 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 5371 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 44
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 7.2 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.4 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 3766 frames, [64.0 KB-128.0 KB]: 1697 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 67.3 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 5463 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5463 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 5462 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 5463 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 5463 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,15 +2,15 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 1.685312271118164,
-            "min": 1.685312271118164,
-            "max": 2.8890349864959717,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 16091.361328125,
-            "min": 16091.361328125,
-            "max": 29632.33984375,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
@@ -26,15 +26,15 @@
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 7.907293319702148,
-            "min": 0.351300984621048,
-            "max": 7.907293319702148,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 1541.9222412109375,
-            "min": 68.15238952636719,
-            "max": 1584.873046875,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
@@ -44,45 +44,45 @@
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
-            "value": 8756.0,
             "min": 8756.0,
             "max": 10945.0,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.07125410158957547,
-            "min": 0.06425344648853164,
-            "max": 0.0730682620646714,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.2850164063583019,
-            "min": 0.26552707483129134,
-            "max": 0.35840099343263054,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.2702636673462157,
-            "min": 0.11407628148456342,
-            "max": 0.2871631226118873,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 1.0810546693848628,
-            "min": 0.4563051259382537,
-            "max": 1.395462342337066,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 2.6940973060000025e-06,
-            "min": 2.6940973060000025e-06,
-            "max": 9.729400270599998e-05,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 1.077638922400001e-05,
-            "min": 1.077638922400001e-05,
-            "max": 0.0004617200382800001,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
@@ -100,7 +100,7 @@
         "SnowballTarget.Policy.Beta.mean": {
             "value": 0.0001444306000000001,
             "min": 0.0001444306000000001,
-            "max": 0.0048649706,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
@@ -110,27 +110,27 @@
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 15.727272727272727,
-            "min": 3.4318181818181817,
-            "max": 15.727272727272727,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 692.0,
-            "min": 151.0,
-            "max": 861.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 15.727272727272727,
-            "min": 3.4318181818181817,
-            "max": 15.727272727272727,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 692.0,
-            "min": 151.0,
-            "max": 861.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
@@ -148,74 +148,74 @@
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1678034896",
         "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "0.29.0.dev0",
         "mlagents_envs_version": "0.29.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.8.1+cu102",
         "numpy_version": "1.22.4",
-        "end_time_seconds": "1678035381"
     },
-    "total": 485.3557066640001,
     "count": 1,
-    "self": 0.4400539790001403,
     "children": {
         "run_training.setup": {
-            "total": 0.11385373099994922,
             "count": 1,
-            "self": 0.11385373099994922
         },
         "TrainerController.start_learning": {
-            "total": 484.801798954,
             "count": 1,
-            "self": 0.526533777004488,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 8.997876354000027,
                     "count": 1,
-                    "self": 8.997876354000027
                 },
                 "TrainerController.advance": {
-                    "total": 475.1535011999955,
-                    "count": 18202,
-                    "self": 0.2930334490002906,
                     "children": {
                         "env_step": {
-                            "total": 474.8604677509952,
-                            "count": 18202,
-                            "self": 329.5822962359972,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 144.98736872400502,
-                                    "count": 18202,
-                                    "self": 1.5943377219991817,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 143.39303100200584,
-                                            "count": 18202,
-                                            "self": 30.800351743011106,
                                             "children": {
                                                 "TorchPolicy.sample_actions": {
-                                                    "total": 112.59267925899474,
-                                                    "count": 18202,
-                                                    "self": 112.59267925899474
                                                 }
                                             }
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.29080279099298423,
-                                    "count": 18202,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 483.2114098329995,
-                                            "count": 18202,
                                             "is_parallel": true,
-                                            "self": 235.90436944599878,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -224,48 +224,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.004791222000108064,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0023365290002175243,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.00245469299989054,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00245469299989054
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.09479242999998405,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0007890579998957037,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.00041478599996480625,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00041478599996480625
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.09181369500004166,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.09181369500004166
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.0017748910000818796,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0003955619999942428,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0013793290000876368,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0013793290000876368
                                                                         }
                                                                     }
                                                                 }
@@ -274,34 +274,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 247.3070403870007,
-                                                    "count": 18201,
                                                     "is_parallel": true,
-                                                    "self": 10.13541609801348,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 5.630104869000434,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 5.630104869000434
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 197.8231598699938,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 197.8231598699938
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 33.71835954999301,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 7.330036332977329,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 26.38832321701568,
-                                                                    "count": 182010,
                                                                     "is_parallel": true,
-                                                                    "self": 26.38832321701568
                                                                 }
                                                             }
                                                         }
@@ -316,9 +316,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 0.00011577300006138103,
                     "count": 1,
-                    "self": 0.00011577300006138103,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -327,36 +327,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 471.5583716319643,
-                                    "count": 409011,
                                     "is_parallel": true,
-                                    "self": 10.690392025921142,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 269.77555193804415,
-                                            "count": 409011,
                                             "is_parallel": true,
-                                            "self": 268.480037919044,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
-                                                    "total": 1.2955140190001657,
                                                     "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 1.2955140190001657
                                                 }
                                             }
                                         },
                                         "_update_policy": {
-                                            "total": 191.092427667999,
                                             "count": 90,
                                             "is_parallel": true,
-                                            "self": 66.223011674997,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 124.86941599300201,
-                                                    "count": 4587,
                                                     "is_parallel": true,
-                                                    "self": 124.86941599300201
                                                 }
                                             }
                                         }
@@ -367,14 +367,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.12377184999991186,
                     "count": 1,
-                    "self": 0.001011028999755581,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.12276082100015628,
                             "count": 1,
-                            "self": 0.12276082100015628
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 1.4694273471832275,
+            "min": 1.4694273471832275,
+            "max": 2.877119541168213,
             "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 14110.9111328125,
+            "min": 14110.9111328125,
+            "max": 29559.52734375,
             "count": 20
         },
         "SnowballTarget.Step.mean": {
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 9.996574401855469,
+            "min": 0.37617459893226624,
+            "max": 9.996574401855469,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 1949.33203125,
+            "min": 72.97787475585938,
+            "max": 2004.43212890625,
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
+            "value": 10945.0,
             "min": 8756.0,
             "max": 10945.0,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.06617252733507056,
+            "min": 0.06253673741004925,
+            "max": 0.07420266700329889,
             "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.26469010934028225,
+            "min": 0.250146949640197,
+            "max": 0.3511263588024603,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.2408758353222819,
+            "min": 0.11121187233982388,
+            "max": 0.26978057647452636,
             "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.9635033412891276,
+            "min": 0.4448474893592955,
+            "max": 1.3489028823726317,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 2.6940973060000016e-06,
+            "min": 2.6940973060000016e-06,
+            "max": 9.729400270600002e-05,
             "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 1.0776389224000007e-05,
+            "min": 1.0776389224000007e-05,
+            "max": 0.00046172003828000015,
             "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
         "SnowballTarget.Policy.Beta.mean": {
             "value": 0.0001444306000000001,
             "min": 0.0001444306000000001,
+            "max": 0.004864970599999999,
             "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 19.886363636363637,
+            "min": 2.8636363636363638,
+            "max": 19.886363636363637,
             "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 875.0,
+            "min": 126.0,
+            "max": 1091.0,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 19.886363636363637,
+            "min": 2.8636363636363638,
+            "max": 19.886363636363637,
             "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 875.0,
+            "min": 126.0,
+            "max": 1091.0,
             "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1678035791",
         "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --force",
         "mlagents_version": "0.29.0.dev0",
         "mlagents_envs_version": "0.29.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.8.1+cu102",
         "numpy_version": "1.22.4",
+        "end_time_seconds": "1678036335"
     },
+    "total": 543.5649645139999,
     "count": 1,
+    "self": 0.785157985000069,
     "children": {
         "run_training.setup": {
+            "total": 0.10759228999995685,
             "count": 1,
+            "self": 0.10759228999995685
         },
         "TrainerController.start_learning": {
+            "total": 542.6722142389999,
             "count": 1,
+            "self": 0.5381760530101474,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 6.928671871999995,
                     "count": 1,
+                    "self": 6.928671871999995
                 },
                 "TrainerController.advance": {
+                    "total": 534.9940004429898,
+                    "count": 18210,
+                    "self": 0.27205131597474974,
                     "children": {
                         "env_step": {
+                            "total": 534.721949127015,
+                            "count": 18210,
+                            "self": 385.2726056480435,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 149.1597922129954,
+                                    "count": 18210,
+                                    "self": 1.5831741370018335,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 147.57661807599357,
+                                            "count": 18210,
+                                            "self": 32.80984432500395,
                                             "children": {
                                                 "TorchPolicy.sample_actions": {
+                                                    "total": 114.76677375098961,
+                                                    "count": 18210,
+                                                    "self": 114.76677375098961
                                                 }
                                             }
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.28955126597611525,
+                                    "count": 18210,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 541.0359419470033,
+                                            "count": 18210,
                                             "is_parallel": true,
+                                            "self": 291.9733024630241,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.0022754120000172406,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0007699310003772553,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0015054809996399854,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0015054809996399854
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.05132571000012831,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0006334280001283332,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.0004171319999386469,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0004171319999386469
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.04818544599993402,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.04818544599993402
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0020897040001273126,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0005734110000048531,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0015162930001224595,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0015162930001224595
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 249.06263948397918,
+                                                    "count": 18209,
                                                     "is_parallel": true,
+                                                    "self": 9.97293427995669,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 5.687937014006593,
+                                                            "count": 18209,
                                                             "is_parallel": true,
+                                                            "self": 5.687937014006593
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 199.5349575030209,
+                                                            "count": 18209,
                                                             "is_parallel": true,
+                                                            "self": 199.5349575030209
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 33.866810686994995,
+                                                            "count": 18209,
                                                             "is_parallel": true,
+                                                            "self": 7.550632629977827,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 26.31617805701717,
+                                                                    "count": 182090,
                                                                     "is_parallel": true,
+                                                                    "self": 26.31617805701717
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 0.00013248899995232932,
                     "count": 1,
+                    "self": 0.00013248899995232932,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 531.2292537309627,
+                                    "count": 410466,
                                     "is_parallel": true,
+                                    "self": 11.0115854399196,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 271.62298273604074,
+                                            "count": 410466,
                                             "is_parallel": true,
+                                            "self": 270.561674838041,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
+                                                    "total": 1.061307897999768,
                                                     "count": 4,
                                                     "is_parallel": true,
+                                                    "self": 1.061307897999768
                                                 }
                                             }
                                         },
                                         "_update_policy": {
+                                            "total": 248.59468555500234,
                                             "count": 90,
                                             "is_parallel": true,
+                                            "self": 97.310092754994,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 151.28459280000834,
+                                                    "count": 7645,
                                                     "is_parallel": true,
+                                                    "self": 151.28459280000834
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.21123338200004582,
                     "count": 1,
+                    "self": 0.002096945999937816,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.209136436000108,
                             "count": 1,
+                            "self": 0.209136436000108
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -4,8 +4,8 @@
             {
                 "steps": 49936,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 9.090909090909092,
-                "creation_time": 1678035026.4217668,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
                 ]
@@ -13,8 +13,8 @@
             {
                 "steps": 99960,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 12.636363636363637,
-                "creation_time": 1678035146.9150894,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
                 ]
@@ -22,8 +22,8 @@
             {
                 "steps": 149984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
-                "reward": 15.909090909090908,
-                "creation_time": 1678035265.6009245,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
                 ]
@@ -31,8 +31,8 @@
             {
                 "steps": 199984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
-                "reward": 15.636363636363637,
-                "creation_time": 1678035381.3155072,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
                 ]
@@ -40,8 +40,8 @@
             {
                 "steps": 200112,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
-                "reward": 15.636363636363637,
-                "creation_time": 1678035381.4671304,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
@@ -50,8 +50,8 @@
         "final_checkpoint": {
             "steps": 200112,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 15.636363636363637,
-            "creation_time": 1678035381.4671304,
             "auxillary_file_paths": [
                 "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]

             {
                 "steps": 49936,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
+                "reward": 9.0,
+                "creation_time": 1678035931.8002622,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
                 ]
             {
                 "steps": 99960,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
+                "reward": 16.09090909090909,
+                "creation_time": 1678036066.813796,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
                 ]
             {
                 "steps": 149984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
+                "reward": 16.181818181818183,
+                "creation_time": 1678036201.2113643,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
                 ]
             {
                 "steps": 199984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
+                "reward": 19.636363636363637,
+                "creation_time": 1678036334.4560852,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
                 ]
             {
                 "steps": 200112,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
+                "reward": 19.636363636363637,
+                "creation_time": 1678036334.7086399,
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
         "final_checkpoint": {
             "steps": 200112,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": 19.636363636363637,
+            "creation_time": 1678036334.7086399,
             "auxillary_file_paths": [
                 "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]