Tiru8055 committed on Jul 3, 2023

Commit

8adac6e

•

1 Parent(s): 11bf15b

First Push

Browse files

Files changed (22) hide show

SnowballTarget.onnx +1 -1
SnowballTarget/SnowballTarget-249984.onnx +3 -0
SnowballTarget/SnowballTarget-249984.pt +3 -0
SnowballTarget/SnowballTarget-299944.onnx +3 -0
SnowballTarget/SnowballTarget-299944.pt +3 -0
SnowballTarget/SnowballTarget-349968.onnx +3 -0
SnowballTarget/SnowballTarget-349968.pt +3 -0
SnowballTarget/SnowballTarget-399968.onnx +3 -0
SnowballTarget/SnowballTarget-399968.pt +3 -0
SnowballTarget/SnowballTarget-449992.onnx +3 -0
SnowballTarget/SnowballTarget-449992.pt +3 -0
SnowballTarget/SnowballTarget-499952.onnx +3 -0
SnowballTarget/SnowballTarget-499952.pt +3 -0
SnowballTarget/SnowballTarget-500016.onnx +3 -0
SnowballTarget/SnowballTarget-500016.pt +3 -0
SnowballTarget/checkpoint.pt +1 -1
SnowballTarget/events.out.tfevents.1688361359.ffe632322ea5.4780.0 +3 -0
config.json +1 -1
configuration.yaml +2 -2
run_logs/Player-0.log +15 -18
run_logs/timers.json +163 -163
run_logs/training_status.json +67 -22

SnowballTarget.onnx CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b840eb91a5e6521ef017585524401ec41e24cab99e94d3e2f1be467355c348ca
 size 646532

 version https://git-lfs.github.com/spec/v1
+oid sha256:72c21525d963aab9361932cffb61b8a8767d334705406fcf9767f2df700b08a0
 size 646532

SnowballTarget/SnowballTarget-249984.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a6f0f8e5ae31a0a6595b25e8c6195d399d87569ee606724398f3517ad05d018c
+size 646532

SnowballTarget/SnowballTarget-249984.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f98c0084b95ae84be8da3911149cac7918910a028f27415e5eb455510a2c5ed7
+size 3843968

SnowballTarget/SnowballTarget-299944.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d164e38db96fb304695415638d60910756c48dae64ad402a7e00f10d3ad1460
+size 646532

SnowballTarget/SnowballTarget-299944.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:655c05349b4b6d2cda393e519d73a48a7e3be912d6dc020d97da6083cc486a58
+size 3843968

SnowballTarget/SnowballTarget-349968.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af861557ca09811875b9d91dd0fdecea9b556d0cdcc1198c8ddf7ca8f47487bd
+size 646532

SnowballTarget/SnowballTarget-349968.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:0f4b5eccc602b2f9f84e77032890cbc87b83d01de3027ceb6771df10047ce363
+size 3843968

SnowballTarget/SnowballTarget-399968.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f48b50fec83dc37be9f17fa1f49aa6c9b16c210b23510857474952c79ee28fb3
+size 646532

SnowballTarget/SnowballTarget-399968.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d985d556ad2844ec0bb394114ad8b91398163067bb8533309fd2d0d6df124db
+size 3843968

SnowballTarget/SnowballTarget-449992.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2ef875b5d499683b7604cb5f2797d9de9579c51ee6695c7cca0fceb0e358cae8
+size 646532

SnowballTarget/SnowballTarget-449992.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c6bef5845adfd0dc936c65a20315b42025bf5177e40efd354e14bcca78d2da82
+size 3843968

SnowballTarget/SnowballTarget-499952.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:72c21525d963aab9361932cffb61b8a8767d334705406fcf9767f2df700b08a0
+size 646532

SnowballTarget/SnowballTarget-499952.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:974042f92d99a1ecfcd8df3683a461bff6b6ac465037a45734b45bc9c1972a9a
+size 3843968

SnowballTarget/SnowballTarget-500016.onnx ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:72c21525d963aab9361932cffb61b8a8767d334705406fcf9767f2df700b08a0
+size 646532

SnowballTarget/SnowballTarget-500016.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e2acd54b73a0c6d4799d4a2c3270d82771984e4ffa693b2dd453b4ac71173204
+size 3843968

SnowballTarget/checkpoint.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9e8a2c04ceb9f4f0f2f753eeac84944fe31f1afe0c03fe7536dc74bd176d2676
 size 3843968

 version https://git-lfs.github.com/spec/v1
+oid sha256:e2acd54b73a0c6d4799d4a2c3270d82771984e4ffa693b2dd453b4ac71173204
 size 3843968

SnowballTarget/events.out.tfevents.1688361359.ffe632322ea5.4780.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7adb75a5e8cc3fcfd524dac7a219a83a9e41a4eade6a857678fae3b2751392f9
+size 25630

config.json CHANGED Viewed

@@ -1 +1 @@

- {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 500000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}

configuration.yaml CHANGED Viewed

@@ -38,7 +38,7 @@ behaviors:
     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
-    max_steps: 200000
     time_horizon: 64
     summary_freq: 10000
     threaded: true
@@ -67,7 +67,7 @@ checkpoint_settings:
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
-  resume: false
   force: false
   train_model: false
   inference: false

     init_path: null
     keep_checkpoints: 10
     even_checkpoints: false
+    max_steps: 500000
     time_horizon: 64
     summary_freq: 10000
     threaded: true
   run_id: SnowballTarget1
   initialize_from: null
   load_model: false
+  resume: true
   force: false
   train_model: false
   inference: false

run_logs/Player-0.log CHANGED Viewed

@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/training-envs-executables/linux/SnowballTarge
 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
-PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/SnowballTarget
-Unable to load player prefs
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2642:(snd_pcm_open_noupdate) Unknown PCM default
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
-- Completed reload, in  0.092 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -45,7 +42,7 @@ ERROR: Shader Standard shader is not supported on this GPU (none of subshaders/f
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
-UnloadTime: 0.814693 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
@@ -53,7 +50,7 @@ Memory Statistics:
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
-      Peak usage frame count: [8.0 KB-16.0 KB]: 5369 frames, [16.0 KB-32.0 KB]: 91 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
@@ -169,22 +166,22 @@ Memory Statistics:
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
-  Peak main deferred allocation count 41
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
-      Peak usage frame count: [4.0 MB-8.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 6.8 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
-      Peak usage frame count: [16.0 MB-32.0 MB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 17.6 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
@@ -213,13 +210,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 4802 frames, [64.0 KB-128.0 KB]: 659 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
-      Peak Allocated memory 66.4 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
-      Peak usage frame count: [32.0 KB-64.0 KB]: 5461 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
@@ -231,13 +228,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5461 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
-      Peak usage frame count: [0.5 MB-1.0 MB]: 5460 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
@@ -249,13 +246,13 @@ Memory Statistics:
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
-      Peak usage frame count: [0-1.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
-      Peak usage frame count: [1.0 KB-2.0 KB]: 5461 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

 Mono config path = '/content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/MonoBleedingEdge/etc'
 Preloaded 'lib_burst_generated.so'
 Preloaded 'libgrpc_csharp_ext.x64.so'
 Initialize engine version: 2021.3.14f1 (eee1884e7226)
 [Subsystems] Discovering subsystems at path /content/ml-agents/training-envs-executables/linux/SnowballTarget/SnowballTarget_Data/UnitySubsystems
 Forcing GfxDevice: Null
 FMOD failed to initialize the output device.: "Error initializing output device. " (60)
 FMOD initialized on nosound output
 Begin MonoManager ReloadAssembly
+- Completed reload, in  0.080 seconds
 ERROR: Shader Sprites/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Sprites/Mask shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 ERROR: Shader Legacy Shaders/VertexLit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 WARNING: Shader Unsupported: 'Standard' - All subshaders removed
 WARNING: Shader Did you use #pragma only_renderers and omit this platform?
 WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
+UnloadTime: 0.723080 ms
 ERROR: Shader UI/Default shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 requesting resize 84 x 84
 Setting up 1 worker threads for Enlighten.
 [ALLOC_TEMP_TLS] TLS Allocator
   StackAllocators :
     [ALLOC_TEMP_MAIN]
+      Peak usage frame count: [8.0 KB-16.0 KB]: 8046 frames, [16.0 KB-32.0 KB]: 136 frames, [2.0 MB-4.0 MB]: 1 frames
       Initial Block Size 4.0 MB
       Current Block Size 4.0 MB
       Peak Allocated Bytes 2.0 MB
       Peak Allocated Bytes 0 B
       Overflow Count 0
 [ALLOC_DEFAULT] Dual Thread Allocator
+  Peak main deferred allocation count 37
     [ALLOC_BUCKET]
       Large Block size 4.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_DEFAULT_MAIN]
+      Peak usage frame count: [4.0 MB-8.0 MB]: 8183 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 7.8 MB
       Peak Large allocation bytes 0 B
     [ALLOC_DEFAULT_THREAD]
+      Peak usage frame count: [16.0 MB-32.0 MB]: 8183 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 17.5 MB
       Peak Large allocation bytes 16.0 MB
 [ALLOC_TEMP_JOB_1_FRAME]
   Initial Block Size 2.0 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_GFX_MAIN]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 7994 frames, [64.0 KB-128.0 KB]: 189 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
+      Peak Allocated memory 66.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_GFX_THREAD]
+      Peak usage frame count: [32.0 KB-64.0 KB]: 8183 frames
       Requested Block Size 16.0 MB
       Peak Block count 1
       Peak Allocated memory 39.6 KB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_CACHEOBJECTS_MAIN]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 8183 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 0.6 MB
       Peak Large allocation bytes 0 B
     [ALLOC_CACHEOBJECTS_THREAD]
+      Peak usage frame count: [0.5 MB-1.0 MB]: 8182 frames, [2.0 MB-4.0 MB]: 1 frames
       Requested Block Size 4.0 MB
       Peak Block count 1
       Peak Allocated memory 2.2 MB
       Used Block count 1
       Peak Allocated bytes 1.0 MB
     [ALLOC_TYPETREE_MAIN]
+      Peak usage frame count: [0-1.0 KB]: 8183 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.0 KB
       Peak Large allocation bytes 0 B
     [ALLOC_TYPETREE_THREAD]
+      Peak usage frame count: [1.0 KB-2.0 KB]: 8183 frames
       Requested Block Size 2.0 MB
       Peak Block count 1
       Peak Allocated memory 1.7 KB

run_logs/timers.json CHANGED Viewed

@@ -2,213 +2,213 @@
     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
-            "value": 0.8457798361778259,
-            "min": 0.8457798361778259,
-            "max": 2.8563437461853027,
-            "count": 20
         },
         "SnowballTarget.Policy.Entropy.sum": {
-            "value": 8094.11279296875,
-            "min": 8094.11279296875,
-            "max": 29251.81640625,
-            "count": 20
         },
         "SnowballTarget.Step.mean": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
         },
         "SnowballTarget.Step.sum": {
-            "value": 199984.0,
-            "min": 9952.0,
-            "max": 199984.0,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
-            "value": 12.897496223449707,
-            "min": 0.4525079131126404,
-            "max": 12.897496223449707,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
-            "value": 2515.01171875,
-            "min": 87.78653717041016,
-            "max": 2620.910888671875,
-            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
-            "count": 20
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
-            "value": 8756.0,
             "min": 8756.0,
             "max": 10945.0,
-            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
-            "value": 0.0660408986672444,
-            "min": 0.06202504008458573,
-            "max": 0.07594248190694534,
-            "count": 20
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
-            "value": 0.2641635946689776,
-            "min": 0.24810016033834292,
-            "max": 0.37971240953472674,
-            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
-            "value": 0.20833415198413763,
-            "min": 0.11108574133672222,
-            "max": 0.2736487640469682,
-            "count": 20
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
-            "value": 0.8333366079365505,
-            "min": 0.4443429653468889,
-            "max": 1.368243820234841,
-            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.mean": {
-            "value": 8.082097306000005e-06,
-            "min": 8.082097306000005e-06,
-            "max": 0.000291882002706,
-            "count": 20
         },
         "SnowballTarget.Policy.LearningRate.sum": {
-            "value": 3.232838922400002e-05,
-            "min": 3.232838922400002e-05,
-            "max": 0.00138516003828,
-            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.mean": {
-            "value": 0.10269400000000001,
-            "min": 0.10269400000000001,
-            "max": 0.19729400000000002,
-            "count": 20
         },
         "SnowballTarget.Policy.Epsilon.sum": {
-            "value": 0.41077600000000003,
-            "min": 0.41077600000000003,
-            "max": 0.96172,
-            "count": 20
         },
         "SnowballTarget.Policy.Beta.mean": {
-            "value": 0.0001444306000000001,
-            "min": 0.0001444306000000001,
-            "max": 0.0048649706,
-            "count": 20
         },
         "SnowballTarget.Policy.Beta.sum": {
-            "value": 0.0005777224000000004,
-            "min": 0.0005777224000000004,
-            "max": 0.023089828,
-            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
-            "value": 25.613636363636363,
-            "min": 3.8181818181818183,
-            "max": 25.727272727272727,
-            "count": 20
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
-            "value": 1127.0,
-            "min": 168.0,
-            "max": 1399.0,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
-            "value": 25.613636363636363,
-            "min": 3.8181818181818183,
-            "max": 25.727272727272727,
-            "count": 20
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
-            "value": 1127.0,
-            "min": 168.0,
-            "max": 1399.0,
-            "count": 20
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 20
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
-            "count": 20
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
-        "start_time_seconds": "1688360621",
         "python_version": "3.10.12 (main, Jun  7 2023, 12:45:35) [GCC 9.4.0]",
-        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
-        "end_time_seconds": "1688361122"
     },
-    "total": 500.95074694299996,
     "count": 1,
-    "self": 0.4364345719999392,
     "children": {
         "run_training.setup": {
-            "total": 0.042037476000018614,
             "count": 1,
-            "self": 0.042037476000018614
         },
         "TrainerController.start_learning": {
-            "total": 500.472274895,
             "count": 1,
-            "self": 0.617950017999874,
             "children": {
                 "TrainerController._reset_env": {
-                    "total": 4.689369449000026,
                     "count": 1,
-                    "self": 4.689369449000026
                 },
                 "TrainerController.advance": {
-                    "total": 495.0138066100002,
-                    "count": 18202,
-                    "self": 0.31194189099733194,
                     "children": {
                         "env_step": {
-                            "total": 494.70186471900286,
-                            "count": 18202,
-                            "self": 359.99233726200856,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
-                                    "total": 134.41122841800131,
-                                    "count": 18202,
-                                    "self": 1.976198901999112,
                                     "children": {
                                         "TorchPolicy.evaluate": {
-                                            "total": 132.4350295160022,
-                                            "count": 18202,
-                                            "self": 132.4350295160022
                                         }
                                     }
                                 },
                                 "workers": {
-                                    "total": 0.2982990389929796,
-                                    "count": 18202,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
-                                            "total": 498.73344575299967,
-                                            "count": 18202,
                                             "is_parallel": true,
-                                            "self": 231.1729418770006,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
@@ -217,48 +217,48 @@
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
-                                                            "total": 0.005294972000001508,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.003601630999980898,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 0.0016933410000206095,
                                                                     "count": 10,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0016933410000206095
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
-                                                            "total": 0.09222192999999379,
                                                             "count": 1,
                                                             "is_parallel": true,
-                                                            "self": 0.0006798279999884471,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
-                                                                    "total": 0.0003048659999649317,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.0003048659999649317
                                                                 },
                                                                 "communicator.exchange": {
-                                                                    "total": 0.08895729800002528,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.08895729800002528
                                                                 },
                                                                 "steps_from_proto": {
-                                                                    "total": 0.002279938000015136,
                                                                     "count": 1,
                                                                     "is_parallel": true,
-                                                                    "self": 0.00038622200003146645,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
-                                                                            "total": 0.0018937159999836695,
                                                                             "count": 10,
                                                                             "is_parallel": true,
-                                                                            "self": 0.0018937159999836695
                                                                         }
                                                                     }
                                                                 }
@@ -267,34 +267,34 @@
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
-                                                    "total": 267.5605038759991,
-                                                    "count": 18201,
                                                     "is_parallel": true,
-                                                    "self": 11.011050943994746,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
-                                                            "total": 5.68991407300183,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 5.68991407300183
                                                         },
                                                         "communicator.exchange": {
-                                                            "total": 212.22475883100407,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 212.22475883100407
                                                         },
                                                         "steps_from_proto": {
-                                                            "total": 38.63478002799843,
-                                                            "count": 18201,
                                                             "is_parallel": true,
-                                                            "self": 7.204467238008817,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
-                                                                    "total": 31.430312789989614,
-                                                                    "count": 182010,
                                                                     "is_parallel": true,
-                                                                    "self": 31.430312789989614
                                                                 }
                                                             }
                                                         }
@@ -309,9 +309,9 @@
                     }
                 },
                 "trainer_threads": {
-                    "total": 9.930499993515696e-05,
                     "count": 1,
-                    "self": 9.930499993515696e-05,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
@@ -320,36 +320,36 @@
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
-                                    "total": 491.19399326699875,
-                                    "count": 468403,
                                     "is_parallel": true,
-                                    "self": 10.452562230021385,
                                     "children": {
                                         "process_trajectory": {
-                                            "total": 270.97192971297744,
-                                            "count": 468403,
                                             "is_parallel": true,
-                                            "self": 269.57651628297737,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
-                                                    "total": 1.395413430000076,
-                                                    "count": 4,
                                                     "is_parallel": true,
-                                                    "self": 1.395413430000076
                                                 }
                                             }
                                         },
                                         "_update_policy": {
-                                            "total": 209.76950132399992,
-                                            "count": 90,
                                             "is_parallel": true,
-                                            "self": 80.41273413999949,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
-                                                    "total": 129.35676718400043,
-                                                    "count": 4584,
                                                     "is_parallel": true,
-                                                    "self": 129.35676718400043
                                                 }
                                             }
                                         }
@@ -360,14 +360,14 @@
                     }
                 },
                 "TrainerController._save_models": {
-                    "total": 0.15104951299997538,
                     "count": 1,
-                    "self": 0.0008534070000223437,
                     "children": {
                         "RLTrainer._checkpoint": {
-                            "total": 0.15019610599995303,
                             "count": 1,
-                            "self": 0.15019610599995303
                         }
                     }
                 }

     "name": "root",
     "gauges": {
         "SnowballTarget.Policy.Entropy.mean": {
+            "value": 0.5554143786430359,
+            "min": 0.5431214570999146,
+            "max": 0.8691041469573975,
+            "count": 30
         },
         "SnowballTarget.Policy.Entropy.sum": {
+            "value": 5351.97314453125,
+            "min": 5228.943359375,
+            "max": 8976.9765625,
+            "count": 30
         },
         "SnowballTarget.Step.mean": {
+            "value": 499952.0,
+            "min": 209936.0,
+            "max": 499952.0,
+            "count": 30
         },
         "SnowballTarget.Step.sum": {
+            "value": 499952.0,
+            "min": 209936.0,
+            "max": 499952.0,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
+            "value": 13.531689643859863,
+            "min": 12.990665435791016,
+            "max": 13.649582862854004,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
+            "value": 2760.464599609375,
+            "min": 2494.838134765625,
+            "max": 2784.514892578125,
+            "count": 30
         },
         "SnowballTarget.Environment.EpisodeLength.mean": {
             "value": 199.0,
             "min": 199.0,
             "max": 199.0,
+            "count": 30
         },
         "SnowballTarget.Environment.EpisodeLength.sum": {
+            "value": 10945.0,
             "min": 8756.0,
             "max": 10945.0,
+            "count": 30
         },
         "SnowballTarget.Losses.PolicyLoss.mean": {
+            "value": 0.0689360275408855,
+            "min": 0.06196786984219216,
+            "max": 0.08477714681004156,
+            "count": 30
         },
         "SnowballTarget.Losses.PolicyLoss.sum": {
+            "value": 0.3446801377044275,
+            "min": 0.24787147936876863,
+            "max": 0.3776190985734894,
+            "count": 30
         },
         "SnowballTarget.Losses.ValueLoss.mean": {
+            "value": 0.17166311223717298,
+            "min": 0.1591150899801184,
+            "max": 0.21358135138072218,
+            "count": 30
         },
         "SnowballTarget.Losses.ValueLoss.sum": {
+            "value": 0.8583155611858649,
+            "min": 0.6364603599204736,
+            "max": 0.9760537848753088,
+            "count": 30
         },
         "SnowballTarget.Policy.LearningRate.mean": {
+            "value": 3.1056989647999945e-06,
+            "min": 3.1056989647999945e-06,
+            "max": 0.00017668564110480002,
+            "count": 30
         },
         "SnowballTarget.Policy.LearningRate.sum": {
+            "value": 1.5528494823999972e-05,
+            "min": 1.5528494823999972e-05,
+            "max": 0.000853728215424,
+            "count": 30
         },
         "SnowballTarget.Policy.Epsilon.mean": {
+            "value": 0.10103520000000002,
+            "min": 0.10103520000000002,
+            "max": 0.15889520000000001,
+            "count": 30
         },
         "SnowballTarget.Policy.Epsilon.sum": {
+            "value": 0.5051760000000001,
+            "min": 0.4120608,
+            "max": 0.7845760000000002,
+            "count": 30
         },
         "SnowballTarget.Policy.Beta.mean": {
+            "value": 6.165647999999992e-05,
+            "min": 6.165647999999992e-05,
+            "max": 0.002948870480000001,
+            "count": 30
         },
         "SnowballTarget.Policy.Beta.sum": {
+            "value": 0.0003082823999999996,
+            "min": 0.0003082823999999996,
+            "max": 0.0142503424,
+            "count": 30
         },
         "SnowballTarget.Environment.CumulativeReward.mean": {
+            "value": 26.254545454545454,
+            "min": 25.072727272727274,
+            "max": 26.818181818181817,
+            "count": 30
         },
         "SnowballTarget.Environment.CumulativeReward.sum": {
+            "value": 1444.0,
+            "min": 1137.0,
+            "max": 1472.0,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicReward.mean": {
+            "value": 26.254545454545454,
+            "min": 25.072727272727274,
+            "max": 26.818181818181817,
+            "count": 30
         },
         "SnowballTarget.Policy.ExtrinsicReward.sum": {
+            "value": 1444.0,
+            "min": 1137.0,
+            "max": 1472.0,
+            "count": 30
         },
         "SnowballTarget.IsTraining.mean": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 30
         },
         "SnowballTarget.IsTraining.sum": {
             "value": 1.0,
             "min": 1.0,
             "max": 1.0,
+            "count": 30
         }
     },
     "metadata": {
         "timer_format_version": "0.1.0",
+        "start_time_seconds": "1688361359",
         "python_version": "3.10.12 (main, Jun  7 2023, 12:45:35) [GCC 9.4.0]",
+        "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics --resume",
         "mlagents_version": "0.31.0.dev0",
         "mlagents_envs_version": "0.31.0.dev0",
         "communication_protocol_version": "1.5.0",
         "pytorch_version": "1.11.0+cu102",
         "numpy_version": "1.21.2",
+        "end_time_seconds": "1688362084"
     },
+    "total": 725.1287801450001,
     "count": 1,
+    "self": 0.42301487899976564,
     "children": {
         "run_training.setup": {
+            "total": 0.03936998600011066,
             "count": 1,
+            "self": 0.03936998600011066
         },
         "TrainerController.start_learning": {
+            "total": 724.6663952800002,
             "count": 1,
+            "self": 0.8414607440045074,
             "children": {
                 "TrainerController._reset_env": {
+                    "total": 3.9242372219998742,
                     "count": 1,
+                    "self": 3.9242372219998742
                 },
                 "TrainerController.advance": {
+                    "total": 719.7430740599957,
+                    "count": 27274,
+                    "self": 0.42077153500281383,
                     "children": {
                         "env_step": {
+                            "total": 719.3223025249929,
+                            "count": 27274,
+                            "self": 524.3226615199812,
                             "children": {
                                 "SubprocessEnvManager._take_step": {
+                                    "total": 194.58223836600496,
+                                    "count": 27274,
+                                    "self": 2.794133769002201,
                                     "children": {
                                         "TorchPolicy.evaluate": {
+                                            "total": 191.78810459700276,
+                                            "count": 27274,
+                                            "self": 191.78810459700276
                                         }
                                     }
                                 },
                                 "workers": {
+                                    "total": 0.4174026390066956,
+                                    "count": 27274,
                                     "self": 0.0,
                                     "children": {
                                         "worker_root": {
+                                            "total": 722.2940654699773,
+                                            "count": 27274,
                                             "is_parallel": true,
+                                            "self": 337.9235702160188,
                                             "children": {
                                                 "run_training.setup": {
                                                     "total": 0.0,
                                                     "self": 0.0,
                                                     "children": {
                                                         "steps_from_proto": {
+                                                            "total": 0.001969485000017812,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0005988259999867296,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 0.0013706590000310825,
                                                                     "count": 10,
                                                                     "is_parallel": true,
+                                                                    "self": 0.0013706590000310825
                                                                 }
                                                             }
                                                         },
                                                         "UnityEnvironment.step": {
+                                                            "total": 0.08242344599989337,
                                                             "count": 1,
                                                             "is_parallel": true,
+                                                            "self": 0.0006884039999022207,
                                                             "children": {
                                                                 "UnityEnvironment._generate_step_input": {
+                                                                    "total": 0.00045308199992177833,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.00045308199992177833
                                                                 },
                                                                 "communicator.exchange": {
+                                                                    "total": 0.07630878300005861,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.07630878300005861
                                                                 },
                                                                 "steps_from_proto": {
+                                                                    "total": 0.0049731770000107645,
                                                                     "count": 1,
                                                                     "is_parallel": true,
+                                                                    "self": 0.002791672000057588,
                                                                     "children": {
                                                                         "_process_rank_one_or_two_observation": {
+                                                                            "total": 0.0021815049999531766,
                                                                             "count": 10,
                                                                             "is_parallel": true,
+                                                                            "self": 0.0021815049999531766
                                                                         }
                                                                     }
                                                                 }
                                                     }
                                                 },
                                                 "UnityEnvironment.step": {
+                                                    "total": 384.37049525395855,
+                                                    "count": 27273,
                                                     "is_parallel": true,
+                                                    "self": 15.486524079959281,
                                                     "children": {
                                                         "UnityEnvironment._generate_step_input": {
+                                                            "total": 8.425367698016771,
+                                                            "count": 27273,
                                                             "is_parallel": true,
+                                                            "self": 8.425367698016771
                                                         },
                                                         "communicator.exchange": {
+                                                            "total": 305.2477889279937,
+                                                            "count": 27273,
                                                             "is_parallel": true,
+                                                            "self": 305.2477889279937
                                                         },
                                                         "steps_from_proto": {
+                                                            "total": 55.210814547988775,
+                                                            "count": 27273,
                                                             "is_parallel": true,
+                                                            "self": 10.211360998963528,
                                                             "children": {
                                                                 "_process_rank_one_or_two_observation": {
+                                                                    "total": 44.99945354902525,
+                                                                    "count": 272730,
                                                                     "is_parallel": true,
+                                                                    "self": 44.99945354902525
                                                                 }
                                                             }
                                                         }
                     }
                 },
                 "trainer_threads": {
+                    "total": 3.70650000149908e-05,
                     "count": 1,
+                    "self": 3.70650000149908e-05,
                     "children": {
                         "thread_root": {
                             "total": 0.0,
                             "self": 0.0,
                             "children": {
                                 "trainer_advance": {
+                                    "total": 714.1417267301904,
+                                    "count": 684441,
                                     "is_parallel": true,
+                                    "self": 15.42709771122577,
                                     "children": {
                                         "process_trajectory": {
+                                            "total": 390.330625886965,
+                                            "count": 684441,
                                             "is_parallel": true,
+                                            "self": 388.8141920999649,
                                             "children": {
                                                 "RLTrainer._checkpoint": {
+                                                    "total": 1.5164337870000963,
+                                                    "count": 6,
                                                     "is_parallel": true,
+                                                    "self": 1.5164337870000963
                                                 }
                                             }
                                         },
                                         "_update_policy": {
+                                            "total": 308.38400313199963,
+                                            "count": 136,
                                             "is_parallel": true,
+                                            "self": 119.26334611800644,
                                             "children": {
                                                 "TorchPPOOptimizer.update": {
+                                                    "total": 189.1206570139932,
+                                                    "count": 6933,
                                                     "is_parallel": true,
+                                                    "self": 189.1206570139932
                                                 }
                                             }
                                         }
                     }
                 },
                 "TrainerController._save_models": {
+                    "total": 0.15758618900008514,
                     "count": 1,
+                    "self": 0.0010900650001985923,
                     "children": {
                         "RLTrainer._checkpoint": {
+                            "total": 0.15649612399988655,
                             "count": 1,
+                            "self": 0.15649612399988655
                         }
                     }
                 }

run_logs/training_status.json CHANGED Viewed

@@ -1,24 +1,6 @@
 {
     "SnowballTarget": {
         "checkpoints": [
-            {
-                "steps": 49936,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
-                "reward": 13.272727272727273,
-                "creation_time": 1688360750.9501905,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
-                ]
-            },
-            {
-                "steps": 99960,
-                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
-                "reward": 22.272727272727273,
-                "creation_time": 1688360873.446901,
-                "auxillary_file_paths": [
-                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
-                ]
-            },
             {
                 "steps": 149984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
@@ -45,15 +27,78 @@
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
             }
         ],
         "final_checkpoint": {
-            "steps": 200112,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
-            "reward": 25.454545454545453,
-            "creation_time": 1688361122.0340798,
             "auxillary_file_paths": [
-                "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
             ]
         }
     },

 {
     "SnowballTarget": {
         "checkpoints": [
             {
                 "steps": 149984,
                 "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
                 "auxillary_file_paths": [
                     "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
                 ]
+            },
+            {
+                "steps": 249984,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-249984.onnx",
+                "reward": 25.818181818181817,
+                "creation_time": 1688361483.6038277,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-249984.pt"
+                ]
+            },
+            {
+                "steps": 299944,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-299944.onnx",
+                "reward": 27.545454545454547,
+                "creation_time": 1688361602.0786066,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-299944.pt"
+                ]
+            },
+            {
+                "steps": 349968,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-349968.onnx",
+                "reward": 26.0,
+                "creation_time": 1688361724.4352,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-349968.pt"
+                ]
+            },
+            {
+                "steps": 399968,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-399968.onnx",
+                "reward": 27.727272727272727,
+                "creation_time": 1688361849.5447729,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-399968.pt"
+                ]
+            },
+            {
+                "steps": 449992,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-449992.onnx",
+                "reward": 26.363636363636363,
+                "creation_time": 1688361966.9275382,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-449992.pt"
+                ]
+            },
+            {
+                "steps": 499952,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-499952.onnx",
+                "reward": 26.363636363636363,
+                "creation_time": 1688362083.6424947,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-499952.pt"
+                ]
+            },
+            {
+                "steps": 500016,
+                "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-500016.onnx",
+                "reward": 26.363636363636363,
+                "creation_time": 1688362083.81968,
+                "auxillary_file_paths": [
+                    "results/SnowballTarget1/SnowballTarget/SnowballTarget-500016.pt"
+                ]
             }
         ],
         "final_checkpoint": {
+            "steps": 500016,
             "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
+            "reward": 26.363636363636363,
+            "creation_time": 1688362083.81968,
             "auxillary_file_paths": [
+                "results/SnowballTarget1/SnowballTarget/SnowballTarget-500016.pt"
             ]
         }
     },