Muhammad Saqib commited on
Commit
550b646
1 Parent(s): 2bd5b65

train on additional 1m steps

Browse files
Huggy.onnx CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:76ab4cc5c2454a034769b7600ad973c0af54d1ec46d918e0ab027c521bdbb3c5
3
  size 2273984
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fbcd8f78abb7d5c2070385f735355585353b163a32f132d5341ea6c89a5b9d4
3
  size 2273984
Huggy/Huggy-2199970.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63a4641cf414342d247d103850177a8429de99efd16f41af27e76bddd7c625ea
3
+ size 2273984
Huggy/Huggy-2199970.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fd5e18bf2ba31c54b51a714a01da0e2eb3cd6236a6331606a3e03aaf3e6c508
3
+ size 13509473
Huggy/Huggy-2399874.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d86e349b6053f96db214adb4e04687560a483a3c1291ac981a0b868eddeb6bc0
3
+ size 2273984
Huggy/Huggy-2399874.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3436cb93c88c3614865af55899b15d2c254d83bce1f88b8389af4a85d1310f1
3
+ size 13509473
Huggy/Huggy-2599974.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:110e2d32f5d0cbf3a053d03d5abd74d0c3cb45c3cc7fe5ba5869bd5ff2722096
3
+ size 2273984
Huggy/Huggy-2599974.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:18838d0540988f314c4d0546db861d75e8e7009a28811702cfbe641587ccc515
3
+ size 13509473
Huggy/Huggy-2799921.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9c380a6c5b7462ce520577edeb1aa0171e2528a05bbe2305d2f443730a5631ef
3
+ size 2273984
Huggy/Huggy-2799921.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d957ae0319ba90c9a0d47dac549bcbacbc749aac7187a697958ed32c00f730c
3
+ size 13509473
Huggy/Huggy-2999908.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:10d51d08e6ebb9dc3f536547658892366445716863d9f46b07e18cdbfb199cd2
3
+ size 2273984
Huggy/Huggy-2999908.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be7d5518395802863bc468f2cce6eed404b5c7be37331ce7c1b4a1b3cca93dc8
3
+ size 13509473
Huggy/Huggy-3000012.onnx ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0fbcd8f78abb7d5c2070385f735355585353b163a32f132d5341ea6c89a5b9d4
3
+ size 2273984
Huggy/Huggy-3000012.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:12d7bb5b669f3c77ef516066765556b6350aa3be87597284712e581baf7bca0b
3
+ size 13509473
Huggy/checkpoint.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:22bd03afe4f0777dd184f88dee622b7680a6926b73a6ebadcf97e94049c79532
3
  size 13509218
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c371157dfc1ba4c7028454ac4e81f03d27d3f733c76d9df46cfe0fe33f3be406
3
  size 13509218
Huggy/events.out.tfevents.1707229530.20a3ae5a77fc.19980.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d5b623d0b78c09f067645e4fc464ab01a72545d3a7ff8a2de0c53e9ed17d4fe
3
+ size 1121
Huggy/events.out.tfevents.1707229684.20a3ae5a77fc.20673.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca15258ea74ef91fb5ad88ac8103fd5ef958c122b4e14e9c59971959afb8cdd0
3
+ size 176578
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"Huggy": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 200000, "network_settings": {"normalize": true, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 15, "even_checkpoints": false, "max_steps": 2000000, "time_horizon": 1000, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./trained-envs-executables/linux/Huggy/Huggy", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Huggy", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"Huggy": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 2048, "buffer_size": 20480, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 200000, "network_settings": {"normalize": true, "hidden_units": 512, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.995, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 15, "even_checkpoints": false, "max_steps": 3000000, "time_horizon": 1000, "summary_freq": 50000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./trained-envs-executables/linux/Huggy/Huggy", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Huggy", "initialize_from": null, "load_model": false, "resume": true, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
configuration.yaml CHANGED
@@ -38,7 +38,7 @@ behaviors:
38
  init_path: null
39
  keep_checkpoints: 15
40
  even_checkpoints: false
41
- max_steps: 2000000
42
  time_horizon: 1000
43
  summary_freq: 50000
44
  threaded: false
@@ -69,7 +69,7 @@ checkpoint_settings:
69
  run_id: Huggy
70
  initialize_from: null
71
  load_model: false
72
- resume: false
73
  force: false
74
  train_model: false
75
  inference: false
 
38
  init_path: null
39
  keep_checkpoints: 15
40
  even_checkpoints: false
41
+ max_steps: 3000000
42
  time_horizon: 1000
43
  summary_freq: 50000
44
  threaded: false
 
69
  run_id: Huggy
70
  initialize_from: null
71
  load_model: false
72
+ resume: true
73
  force: false
74
  train_model: false
75
  inference: false
run_logs/Player-0.log CHANGED
@@ -2,9 +2,6 @@ Mono path[0] = '/content/ml-agents/trained-envs-executables/linux/Huggy/Huggy_Da
2
  Mono config path = '/content/ml-agents/trained-envs-executables/linux/Huggy/Huggy_Data/MonoBleedingEdge/etc'
3
  Preloaded 'lib_burst_generated.so'
4
  Preloaded 'libgrpc_csharp_ext.x64.so'
5
- PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face
6
- PlayerPrefs - Creating folder: /root/.config/unity3d/Hugging Face/Huggy
7
- Unable to load player prefs
8
  Initialize engine version: 2021.3.14f1 (eee1884e7226)
9
  [Subsystems] Discovering subsystems at path /content/ml-agents/trained-envs-executables/linux/Huggy/Huggy_Data/UnitySubsystems
10
  Forcing GfxDevice: Null
@@ -34,7 +31,7 @@ ALSA lib pcm.c:2664:(snd_pcm_open_noupdate) Unknown PCM default
34
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
35
  FMOD initialized on nosound output
36
  Begin MonoManager ReloadAssembly
37
- - Completed reload, in 0.088 seconds
38
  ERROR: Shader Hidden/Universal Render Pipeline/Blit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
39
  ERROR: Shader Hidden/Universal Render Pipeline/CopyDepth shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
40
  ERROR: Shader Hidden/Universal Render Pipeline/ScreenSpaceShadows shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
@@ -78,14 +75,14 @@ ERROR: Shader Universal Render Pipeline/Lit shader is not supported on this GPU
78
  WARNING: Shader Unsupported: 'Universal Render Pipeline/Lit' - All subshaders removed
79
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
80
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
81
- UnloadTime: 0.773317 ms
82
  requesting resize 84 x 84
83
  Setting up 1 worker threads for Enlighten.
84
  Memory Statistics:
85
  [ALLOC_TEMP_TLS] TLS Allocator
86
  StackAllocators :
87
  [ALLOC_TEMP_MAIN]
88
- Peak usage frame count: [4.0 KB-8.0 KB]: 26755 frames, [2.0 MB-4.0 MB]: 1 frames
89
  Initial Block Size 4.0 MB
90
  Current Block Size 4.0 MB
91
  Peak Allocated Bytes 3.6 MB
@@ -93,7 +90,7 @@ Memory Statistics:
93
  [ALLOC_TEMP_Loading.AsyncRead]
94
  Initial Block Size 64.0 KB
95
  Current Block Size 64.0 KB
96
- Peak Allocated Bytes 152 B
97
  Overflow Count 0
98
  [ALLOC_TEMP_Loading.PreloadManager]
99
  Initial Block Size 256.0 KB
@@ -201,22 +198,22 @@ Memory Statistics:
201
  Peak Allocated Bytes 0 B
202
  Overflow Count 0
203
  [ALLOC_DEFAULT] Dual Thread Allocator
204
- Peak main deferred allocation count 212
205
  [ALLOC_BUCKET]
206
  Large Block size 4.0 MB
207
  Used Block count 1
208
  Peak Allocated bytes 1.4 MB
209
  [ALLOC_DEFAULT_MAIN]
210
- Peak usage frame count: [16.0 MB-32.0 MB]: 26756 frames
211
  Requested Block Size 16.0 MB
212
  Peak Block count 1
213
- Peak Allocated memory 23.5 MB
214
  Peak Large allocation bytes 16.0 MB
215
  [ALLOC_DEFAULT_THREAD]
216
- Peak usage frame count: [2.0 MB-4.0 MB]: 26756 frames
217
  Requested Block Size 16.0 MB
218
  Peak Block count 1
219
- Peak Allocated memory 2.6 MB
220
  Peak Large allocation bytes 0 B
221
  [ALLOC_TEMP_JOB_1_FRAME]
222
  Initial Block Size 2.0 MB
@@ -245,13 +242,13 @@ Memory Statistics:
245
  Used Block count 1
246
  Peak Allocated bytes 1.4 MB
247
  [ALLOC_GFX_MAIN]
248
- Peak usage frame count: [32.0 KB-64.0 KB]: 26755 frames, [64.0 KB-128.0 KB]: 1 frames
249
  Requested Block Size 16.0 MB
250
  Peak Block count 1
251
  Peak Allocated memory 65.6 KB
252
  Peak Large allocation bytes 0 B
253
  [ALLOC_GFX_THREAD]
254
- Peak usage frame count: [64.0 KB-128.0 KB]: 26756 frames
255
  Requested Block Size 16.0 MB
256
  Peak Block count 1
257
  Peak Allocated memory 81.8 KB
@@ -263,13 +260,13 @@ Memory Statistics:
263
  Used Block count 1
264
  Peak Allocated bytes 1.4 MB
265
  [ALLOC_CACHEOBJECTS_MAIN]
266
- Peak usage frame count: [1.0 MB-2.0 MB]: 26755 frames, [16.0 MB-32.0 MB]: 1 frames
267
  Requested Block Size 4.0 MB
268
  Peak Block count 2
269
  Peak Allocated memory 30.6 MB
270
  Peak Large allocation bytes 24.9 MB
271
  [ALLOC_CACHEOBJECTS_THREAD]
272
- Peak usage frame count: [0.5 MB-1.0 MB]: 26755 frames, [2.0 MB-4.0 MB]: 1 frames
273
  Requested Block Size 4.0 MB
274
  Peak Block count 1
275
  Peak Allocated memory 2.6 MB
@@ -281,13 +278,13 @@ Memory Statistics:
281
  Used Block count 1
282
  Peak Allocated bytes 1.4 MB
283
  [ALLOC_TYPETREE_MAIN]
284
- Peak usage frame count: [0-1.0 KB]: 26756 frames
285
  Requested Block Size 2.0 MB
286
  Peak Block count 1
287
  Peak Allocated memory 1.0 KB
288
  Peak Large allocation bytes 0 B
289
  [ALLOC_TYPETREE_THREAD]
290
- Peak usage frame count: [4.0 KB-8.0 KB]: 26756 frames
291
  Requested Block Size 2.0 MB
292
  Peak Block count 1
293
  Peak Allocated memory 7.3 KB
 
2
  Mono config path = '/content/ml-agents/trained-envs-executables/linux/Huggy/Huggy_Data/MonoBleedingEdge/etc'
3
  Preloaded 'lib_burst_generated.so'
4
  Preloaded 'libgrpc_csharp_ext.x64.so'
 
 
 
5
  Initialize engine version: 2021.3.14f1 (eee1884e7226)
6
  [Subsystems] Discovering subsystems at path /content/ml-agents/trained-envs-executables/linux/Huggy/Huggy_Data/UnitySubsystems
7
  Forcing GfxDevice: Null
 
31
  FMOD failed to initialize the output device.: "Error initializing output device. " (60)
32
  FMOD initialized on nosound output
33
  Begin MonoManager ReloadAssembly
34
+ - Completed reload, in 0.101 seconds
35
  ERROR: Shader Hidden/Universal Render Pipeline/Blit shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
36
  ERROR: Shader Hidden/Universal Render Pipeline/CopyDepth shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
37
  ERROR: Shader Hidden/Universal Render Pipeline/ScreenSpaceShadows shader is not supported on this GPU (none of subshaders/fallbacks are suitable)
 
75
  WARNING: Shader Unsupported: 'Universal Render Pipeline/Lit' - All subshaders removed
76
  WARNING: Shader Did you use #pragma only_renderers and omit this platform?
77
  WARNING: Shader If subshaders removal was intentional, you may have forgotten turning Fallback off?
78
+ UnloadTime: 0.783364 ms
79
  requesting resize 84 x 84
80
  Setting up 1 worker threads for Enlighten.
81
  Memory Statistics:
82
  [ALLOC_TEMP_TLS] TLS Allocator
83
  StackAllocators :
84
  [ALLOC_TEMP_MAIN]
85
+ Peak usage frame count: [4.0 KB-8.0 KB]: 13418 frames, [2.0 MB-4.0 MB]: 1 frames
86
  Initial Block Size 4.0 MB
87
  Current Block Size 4.0 MB
88
  Peak Allocated Bytes 3.6 MB
 
90
  [ALLOC_TEMP_Loading.AsyncRead]
91
  Initial Block Size 64.0 KB
92
  Current Block Size 64.0 KB
93
+ Peak Allocated Bytes 176 B
94
  Overflow Count 0
95
  [ALLOC_TEMP_Loading.PreloadManager]
96
  Initial Block Size 256.0 KB
 
198
  Peak Allocated Bytes 0 B
199
  Overflow Count 0
200
  [ALLOC_DEFAULT] Dual Thread Allocator
201
+ Peak main deferred allocation count 326
202
  [ALLOC_BUCKET]
203
  Large Block size 4.0 MB
204
  Used Block count 1
205
  Peak Allocated bytes 1.4 MB
206
  [ALLOC_DEFAULT_MAIN]
207
+ Peak usage frame count: [16.0 MB-32.0 MB]: 13419 frames
208
  Requested Block Size 16.0 MB
209
  Peak Block count 1
210
+ Peak Allocated memory 23.2 MB
211
  Peak Large allocation bytes 16.0 MB
212
  [ALLOC_DEFAULT_THREAD]
213
+ Peak usage frame count: [2.0 MB-4.0 MB]: 13419 frames
214
  Requested Block Size 16.0 MB
215
  Peak Block count 1
216
+ Peak Allocated memory 2.5 MB
217
  Peak Large allocation bytes 0 B
218
  [ALLOC_TEMP_JOB_1_FRAME]
219
  Initial Block Size 2.0 MB
 
242
  Used Block count 1
243
  Peak Allocated bytes 1.4 MB
244
  [ALLOC_GFX_MAIN]
245
+ Peak usage frame count: [32.0 KB-64.0 KB]: 13418 frames, [64.0 KB-128.0 KB]: 1 frames
246
  Requested Block Size 16.0 MB
247
  Peak Block count 1
248
  Peak Allocated memory 65.6 KB
249
  Peak Large allocation bytes 0 B
250
  [ALLOC_GFX_THREAD]
251
+ Peak usage frame count: [64.0 KB-128.0 KB]: 13419 frames
252
  Requested Block Size 16.0 MB
253
  Peak Block count 1
254
  Peak Allocated memory 81.8 KB
 
260
  Used Block count 1
261
  Peak Allocated bytes 1.4 MB
262
  [ALLOC_CACHEOBJECTS_MAIN]
263
+ Peak usage frame count: [1.0 MB-2.0 MB]: 13418 frames, [16.0 MB-32.0 MB]: 1 frames
264
  Requested Block Size 4.0 MB
265
  Peak Block count 2
266
  Peak Allocated memory 30.6 MB
267
  Peak Large allocation bytes 24.9 MB
268
  [ALLOC_CACHEOBJECTS_THREAD]
269
+ Peak usage frame count: [0.5 MB-1.0 MB]: 13418 frames, [2.0 MB-4.0 MB]: 1 frames
270
  Requested Block Size 4.0 MB
271
  Peak Block count 1
272
  Peak Allocated memory 2.6 MB
 
278
  Used Block count 1
279
  Peak Allocated bytes 1.4 MB
280
  [ALLOC_TYPETREE_MAIN]
281
+ Peak usage frame count: [0-1.0 KB]: 13419 frames
282
  Requested Block Size 2.0 MB
283
  Peak Block count 1
284
  Peak Allocated memory 1.0 KB
285
  Peak Large allocation bytes 0 B
286
  [ALLOC_TYPETREE_THREAD]
287
+ Peak usage frame count: [4.0 KB-8.0 KB]: 13419 frames
288
  Requested Block Size 2.0 MB
289
  Peak Block count 1
290
  Peak Allocated memory 7.3 KB
run_logs/timers.json CHANGED
@@ -2,213 +2,213 @@
2
  "name": "root",
3
  "gauges": {
4
  "Huggy.Policy.Entropy.mean": {
5
- "value": 1.40479576587677,
6
- "min": 1.40479576587677,
7
- "max": 1.4262832403182983,
8
- "count": 40
9
  },
10
  "Huggy.Policy.Entropy.sum": {
11
- "value": 70746.921875,
12
- "min": 68906.0859375,
13
- "max": 77985.328125,
14
- "count": 40
15
  },
16
  "Huggy.Environment.EpisodeLength.mean": {
17
- "value": 76.35085007727976,
18
- "min": 74.21385542168674,
19
- "max": 386.5615384615385,
20
- "count": 40
21
  },
22
  "Huggy.Environment.EpisodeLength.sum": {
23
- "value": 49399.0,
24
- "min": 49278.0,
25
- "max": 50253.0,
26
- "count": 40
27
  },
28
  "Huggy.Step.mean": {
29
- "value": 1999987.0,
30
- "min": 49991.0,
31
- "max": 1999987.0,
32
- "count": 40
33
  },
34
  "Huggy.Step.sum": {
35
- "value": 1999987.0,
36
- "min": 49991.0,
37
- "max": 1999987.0,
38
- "count": 40
39
  },
40
  "Huggy.Policy.ExtrinsicValueEstimate.mean": {
41
- "value": 2.4954729080200195,
42
- "min": 0.10935484617948532,
43
- "max": 2.5171620845794678,
44
- "count": 40
45
  },
46
  "Huggy.Policy.ExtrinsicValueEstimate.sum": {
47
- "value": 1614.571044921875,
48
- "min": 14.106775283813477,
49
- "max": 1650.9215087890625,
50
- "count": 40
51
  },
52
  "Huggy.Environment.CumulativeReward.mean": {
53
- "value": 3.9151884355169178,
54
- "min": 1.7759710487931273,
55
- "max": 4.0382681907269,
56
- "count": 40
57
  },
58
  "Huggy.Environment.CumulativeReward.sum": {
59
- "value": 2533.1269177794456,
60
- "min": 229.10026529431343,
61
- "max": 2586.368226826191,
62
- "count": 40
63
  },
64
  "Huggy.Policy.ExtrinsicReward.mean": {
65
- "value": 3.9151884355169178,
66
- "min": 1.7759710487931273,
67
- "max": 4.0382681907269,
68
- "count": 40
69
  },
70
  "Huggy.Policy.ExtrinsicReward.sum": {
71
- "value": 2533.1269177794456,
72
- "min": 229.10026529431343,
73
- "max": 2586.368226826191,
74
- "count": 40
75
  },
76
  "Huggy.Losses.PolicyLoss.mean": {
77
- "value": 0.019103528304711088,
78
- "min": 0.014227674743203049,
79
- "max": 0.020454438457575937,
80
- "count": 40
81
  },
82
  "Huggy.Losses.PolicyLoss.sum": {
83
- "value": 0.05731058491413326,
84
- "min": 0.028455349486406097,
85
- "max": 0.057827948908864835,
86
- "count": 40
87
  },
88
  "Huggy.Losses.ValueLoss.mean": {
89
- "value": 0.05863657374348905,
90
- "min": 0.02132847082490722,
91
- "max": 0.0604518906523784,
92
- "count": 40
93
  },
94
  "Huggy.Losses.ValueLoss.sum": {
95
- "value": 0.17590972123046716,
96
- "min": 0.04265694164981444,
97
- "max": 0.1813556719571352,
98
- "count": 40
99
  },
100
  "Huggy.Policy.LearningRate.mean": {
101
- "value": 3.6815987728333375e-06,
102
- "min": 3.6815987728333375e-06,
103
- "max": 0.0002953593765468749,
104
- "count": 40
105
  },
106
  "Huggy.Policy.LearningRate.sum": {
107
- "value": 1.1044796318500013e-05,
108
- "min": 1.1044796318500013e-05,
109
- "max": 0.0008440443186519,
110
- "count": 40
111
  },
112
  "Huggy.Policy.Epsilon.mean": {
113
- "value": 0.10122716666666669,
114
- "min": 0.10122716666666669,
115
- "max": 0.19845312500000006,
116
- "count": 40
117
  },
118
  "Huggy.Policy.Epsilon.sum": {
119
- "value": 0.30368150000000005,
120
- "min": 0.2076262,
121
- "max": 0.5813480999999999,
122
- "count": 40
123
  },
124
  "Huggy.Policy.Beta.mean": {
125
- "value": 7.123561666666675e-05,
126
- "min": 7.123561666666675e-05,
127
- "max": 0.004922810937499999,
128
- "count": 40
129
  },
130
  "Huggy.Policy.Beta.sum": {
131
- "value": 0.00021370685000000024,
132
- "min": 0.00021370685000000024,
133
- "max": 0.014069270190000002,
134
- "count": 40
135
  },
136
  "Huggy.IsTraining.mean": {
137
  "value": 1.0,
138
  "min": 1.0,
139
  "max": 1.0,
140
- "count": 40
141
  },
142
  "Huggy.IsTraining.sum": {
143
  "value": 1.0,
144
  "min": 1.0,
145
  "max": 1.0,
146
- "count": 40
147
  }
148
  },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
- "start_time_seconds": "1707226407",
152
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
153
- "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy --no-graphics",
154
  "mlagents_version": "1.1.0.dev0",
155
  "mlagents_envs_version": "1.1.0.dev0",
156
  "communication_protocol_version": "1.5.0",
157
  "pytorch_version": "2.2.0+cu121",
158
  "numpy_version": "1.23.5",
159
- "end_time_seconds": "1707228817"
160
  },
161
- "total": 2409.440081134,
162
  "count": 1,
163
- "self": 0.44169744000009814,
164
  "children": {
165
  "run_training.setup": {
166
- "total": 0.04923977999987983,
167
  "count": 1,
168
- "self": 0.04923977999987983
169
  },
170
  "TrainerController.start_learning": {
171
- "total": 2408.949143914,
172
  "count": 1,
173
- "self": 4.509431323028366,
174
  "children": {
175
  "TrainerController._reset_env": {
176
- "total": 2.9892884610001147,
177
  "count": 1,
178
- "self": 2.9892884610001147
179
  },
180
  "TrainerController.advance": {
181
- "total": 2401.323403468972,
182
- "count": 233222,
183
- "self": 4.9041543729199475,
184
  "children": {
185
  "env_step": {
186
- "total": 1939.5104788280173,
187
- "count": 233222,
188
- "self": 1609.9971716006812,
189
  "children": {
190
  "SubprocessEnvManager._take_step": {
191
- "total": 326.6790022380692,
192
- "count": 233222,
193
- "self": 16.749791363120494,
194
  "children": {
195
  "TorchPolicy.evaluate": {
196
- "total": 309.9292108749487,
197
- "count": 222963,
198
- "self": 309.9292108749487
199
  }
200
  }
201
  },
202
  "workers": {
203
- "total": 2.8343049892669114,
204
- "count": 233222,
205
  "self": 0.0,
206
  "children": {
207
  "worker_root": {
208
- "total": 2401.659049063007,
209
- "count": 233222,
210
  "is_parallel": true,
211
- "self": 1088.6713370230154,
212
  "children": {
213
  "run_training.setup": {
214
  "total": 0.0,
@@ -217,48 +217,48 @@
217
  "self": 0.0,
218
  "children": {
219
  "steps_from_proto": {
220
- "total": 0.0009009340001284727,
221
  "count": 1,
222
  "is_parallel": true,
223
- "self": 0.00025307400005658565,
224
  "children": {
225
  "_process_rank_one_or_two_observation": {
226
- "total": 0.000647860000071887,
227
  "count": 2,
228
  "is_parallel": true,
229
- "self": 0.000647860000071887
230
  }
231
  }
232
  },
233
  "UnityEnvironment.step": {
234
- "total": 0.032897016000106305,
235
  "count": 1,
236
  "is_parallel": true,
237
- "self": 0.00039493999975093175,
238
  "children": {
239
  "UnityEnvironment._generate_step_input": {
240
- "total": 0.00025312900015705964,
241
  "count": 1,
242
  "is_parallel": true,
243
- "self": 0.00025312900015705964
244
  },
245
  "communicator.exchange": {
246
- "total": 0.03144854800007124,
247
  "count": 1,
248
  "is_parallel": true,
249
- "self": 0.03144854800007124
250
  },
251
  "steps_from_proto": {
252
- "total": 0.0008003990001270722,
253
  "count": 1,
254
  "is_parallel": true,
255
- "self": 0.00020498000026236696,
256
  "children": {
257
  "_process_rank_one_or_two_observation": {
258
- "total": 0.0005954189998647053,
259
  "count": 2,
260
  "is_parallel": true,
261
- "self": 0.0005954189998647053
262
  }
263
  }
264
  }
@@ -267,34 +267,34 @@
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
- "total": 1312.9877120399915,
271
- "count": 233221,
272
  "is_parallel": true,
273
- "self": 41.25639111639907,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
- "total": 85.96511211693633,
277
- "count": 233221,
278
  "is_parallel": true,
279
- "self": 85.96511211693633
280
  },
281
  "communicator.exchange": {
282
- "total": 1092.4745247058486,
283
- "count": 233221,
284
  "is_parallel": true,
285
- "self": 1092.4745247058486
286
  },
287
  "steps_from_proto": {
288
- "total": 93.29168410080752,
289
- "count": 233221,
290
  "is_parallel": true,
291
- "self": 34.65772516784432,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
- "total": 58.633958932963196,
295
- "count": 466442,
296
  "is_parallel": true,
297
- "self": 58.633958932963196
298
  }
299
  }
300
  }
@@ -307,31 +307,31 @@
307
  }
308
  },
309
  "trainer_advance": {
310
- "total": 456.90877026803514,
311
- "count": 233222,
312
- "self": 6.625547788050881,
313
  "children": {
314
  "process_trajectory": {
315
- "total": 158.5469349989853,
316
- "count": 233222,
317
- "self": 157.33874496698422,
318
  "children": {
319
  "RLTrainer._checkpoint": {
320
- "total": 1.2081900320010845,
321
- "count": 10,
322
- "self": 1.2081900320010845
323
  }
324
  }
325
  },
326
  "_update_policy": {
327
- "total": 291.73628748099895,
328
- "count": 97,
329
- "self": 231.13104093599577,
330
  "children": {
331
  "TorchPPOOptimizer.update": {
332
- "total": 60.60524654500318,
333
- "count": 2910,
334
- "self": 60.60524654500318
335
  }
336
  }
337
  }
@@ -340,19 +340,19 @@
340
  }
341
  },
342
  "trainer_threads": {
343
- "total": 1.3639996723213699e-06,
344
  "count": 1,
345
- "self": 1.3639996723213699e-06
346
  },
347
  "TrainerController._save_models": {
348
- "total": 0.12701929700006076,
349
  "count": 1,
350
- "self": 0.002057402000446018,
351
  "children": {
352
  "RLTrainer._checkpoint": {
353
- "total": 0.12496189499961474,
354
  "count": 1,
355
- "self": 0.12496189499961474
356
  }
357
  }
358
  }
 
2
  "name": "root",
3
  "gauges": {
4
  "Huggy.Policy.Entropy.mean": {
5
+ "value": 1.4002948999404907,
6
+ "min": 1.400290846824646,
7
+ "max": 1.4044567346572876,
8
+ "count": 20
9
  },
10
  "Huggy.Policy.Entropy.sum": {
11
+ "value": 70707.890625,
12
+ "min": 68126.109375,
13
+ "max": 71574.140625,
14
+ "count": 20
15
  },
16
  "Huggy.Environment.EpisodeLength.mean": {
17
+ "value": 92.73170731707317,
18
+ "min": 66.15725806451613,
19
+ "max": 92.73170731707317,
20
+ "count": 20
21
  },
22
  "Huggy.Environment.EpisodeLength.sum": {
23
+ "value": 49426.0,
24
+ "min": 49221.0,
25
+ "max": 49556.0,
26
+ "count": 20
27
  },
28
  "Huggy.Step.mean": {
29
+ "value": 2999908.0,
30
+ "min": 2049981.0,
31
+ "max": 2999908.0,
32
+ "count": 20
33
  },
34
  "Huggy.Step.sum": {
35
+ "value": 2999908.0,
36
+ "min": 2049981.0,
37
+ "max": 2999908.0,
38
+ "count": 20
39
  },
40
  "Huggy.Policy.ExtrinsicValueEstimate.mean": {
41
+ "value": 2.4432694911956787,
42
+ "min": 2.442089557647705,
43
+ "max": 2.5468037128448486,
44
+ "count": 20
45
  },
46
  "Huggy.Policy.ExtrinsicValueEstimate.sum": {
47
+ "value": 1302.2626953125,
48
+ "min": 1302.2626953125,
49
+ "max": 1863.03515625,
50
+ "count": 20
51
  },
52
  "Huggy.Environment.CumulativeReward.mean": {
53
+ "value": 3.7131219303853964,
54
+ "min": 3.7131219303853964,
55
+ "max": 4.026137485445201,
56
+ "count": 20
57
  },
58
  "Huggy.Environment.CumulativeReward.sum": {
59
+ "value": 1979.0939888954163,
60
+ "min": 1979.0939888954163,
61
+ "max": 2931.028089404106,
62
+ "count": 20
63
  },
64
  "Huggy.Policy.ExtrinsicReward.mean": {
65
+ "value": 3.7131219303853964,
66
+ "min": 3.7131219303853964,
67
+ "max": 4.026137485445201,
68
+ "count": 20
69
  },
70
  "Huggy.Policy.ExtrinsicReward.sum": {
71
+ "value": 1979.0939888954163,
72
+ "min": 1979.0939888954163,
73
+ "max": 2931.028089404106,
74
+ "count": 20
75
  },
76
  "Huggy.Losses.PolicyLoss.mean": {
77
+ "value": 0.016497817036967413,
78
+ "min": 0.014403317138850171,
79
+ "max": 0.021526213961381775,
80
+ "count": 20
81
  },
82
  "Huggy.Losses.PolicyLoss.sum": {
83
+ "value": 0.032995634073934826,
84
+ "min": 0.03035465927775173,
85
+ "max": 0.056156814580026554,
86
+ "count": 20
87
  },
88
  "Huggy.Losses.ValueLoss.mean": {
89
+ "value": 0.047286525989572205,
90
+ "min": 0.047286525989572205,
91
+ "max": 0.0675045739238461,
92
+ "count": 20
93
  },
94
  "Huggy.Losses.ValueLoss.sum": {
95
+ "value": 0.09457305197914441,
96
+ "min": 0.09457305197914441,
97
+ "max": 0.18123736369113128,
98
+ "count": 20
99
  },
100
  "Huggy.Policy.LearningRate.mean": {
101
+ "value": 2.3148492284166755e-06,
102
+ "min": 2.3148492284166755e-06,
103
+ "max": 9.691496769503332e-05,
104
+ "count": 20
105
  },
106
  "Huggy.Policy.LearningRate.sum": {
107
+ "value": 4.629698456833351e-06,
108
+ "min": 4.629698456833351e-06,
109
+ "max": 0.00026304131231963336,
110
+ "count": 20
111
  },
112
  "Huggy.Policy.Epsilon.mean": {
113
+ "value": 0.10077158333333334,
114
+ "min": 0.10077158333333334,
115
+ "max": 0.1323049666666667,
116
+ "count": 20
117
  },
118
  "Huggy.Policy.Epsilon.sum": {
119
+ "value": 0.2015431666666667,
120
+ "min": 0.2015431666666667,
121
+ "max": 0.3876803666666667,
122
+ "count": 20
123
  },
124
  "Huggy.Policy.Beta.mean": {
125
+ "value": 4.850200833333351e-05,
126
+ "min": 4.850200833333351e-05,
127
+ "max": 0.0016220178366666666,
128
+ "count": 20
129
  },
130
  "Huggy.Policy.Beta.sum": {
131
+ "value": 9.700401666666702e-05,
132
+ "min": 9.700401666666702e-05,
133
+ "max": 0.004405250296666668,
134
+ "count": 20
135
  },
136
  "Huggy.IsTraining.mean": {
137
  "value": 1.0,
138
  "min": 1.0,
139
  "max": 1.0,
140
+ "count": 20
141
  },
142
  "Huggy.IsTraining.sum": {
143
  "value": 1.0,
144
  "min": 1.0,
145
  "max": 1.0,
146
+ "count": 20
147
  }
148
  },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
+ "start_time_seconds": "1707229684",
152
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
153
+ "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/Huggy.yaml --env=./trained-envs-executables/linux/Huggy/Huggy --run-id=Huggy --no-graphics --resume",
154
  "mlagents_version": "1.1.0.dev0",
155
  "mlagents_envs_version": "1.1.0.dev0",
156
  "communication_protocol_version": "1.5.0",
157
  "pytorch_version": "2.2.0+cu121",
158
  "numpy_version": "1.23.5",
159
+ "end_time_seconds": "1707230903"
160
  },
161
+ "total": 1219.2884672870005,
162
  "count": 1,
163
+ "self": 0.4370836470006907,
164
  "children": {
165
  "run_training.setup": {
166
+ "total": 0.04692796699964674,
167
  "count": 1,
168
+ "self": 0.04692796699964674
169
  },
170
  "TrainerController.start_learning": {
171
+ "total": 1218.8044556730001,
172
  "count": 1,
173
+ "self": 2.343180128024869,
174
  "children": {
175
  "TrainerController._reset_env": {
176
+ "total": 2.1479978630004553,
177
  "count": 1,
178
+ "self": 2.1479978630004553
179
  },
180
  "TrainerController.advance": {
181
+ "total": 1214.1848600489748,
182
+ "count": 118128,
183
+ "self": 2.452056089875441,
184
  "children": {
185
  "env_step": {
186
+ "total": 974.6812306079783,
187
+ "count": 118128,
188
+ "self": 807.4357161978896,
189
  "children": {
190
  "SubprocessEnvManager._take_step": {
191
+ "total": 165.77706546212357,
192
+ "count": 118128,
193
+ "self": 8.387665497116359,
194
  "children": {
195
  "TorchPolicy.evaluate": {
196
+ "total": 157.38939996500721,
197
+ "count": 111823,
198
+ "self": 157.38939996500721
199
  }
200
  }
201
  },
202
  "workers": {
203
+ "total": 1.4684489479650438,
204
+ "count": 118128,
205
  "self": 0.0,
206
  "children": {
207
  "worker_root": {
208
+ "total": 1214.8518558820324,
209
+ "count": 118128,
210
  "is_parallel": true,
211
+ "self": 556.5244112889222,
212
  "children": {
213
  "run_training.setup": {
214
  "total": 0.0,
 
217
  "self": 0.0,
218
  "children": {
219
  "steps_from_proto": {
220
+ "total": 0.0011551730003702687,
221
  "count": 1,
222
  "is_parallel": true,
223
+ "self": 0.00035466300050757127,
224
  "children": {
225
  "_process_rank_one_or_two_observation": {
226
+ "total": 0.0008005099998626974,
227
  "count": 2,
228
  "is_parallel": true,
229
+ "self": 0.0008005099998626974
230
  }
231
  }
232
  },
233
  "UnityEnvironment.step": {
234
+ "total": 0.02979850100018666,
235
  "count": 1,
236
  "is_parallel": true,
237
+ "self": 0.0003212329993402818,
238
  "children": {
239
  "UnityEnvironment._generate_step_input": {
240
+ "total": 0.00020562200006679632,
241
  "count": 1,
242
  "is_parallel": true,
243
+ "self": 0.00020562200006679632
244
  },
245
  "communicator.exchange": {
246
+ "total": 0.028506298000138486,
247
  "count": 1,
248
  "is_parallel": true,
249
+ "self": 0.028506298000138486
250
  },
251
  "steps_from_proto": {
252
+ "total": 0.0007653480006410973,
253
  "count": 1,
254
  "is_parallel": true,
255
+ "self": 0.00022463200002675876,
256
  "children": {
257
  "_process_rank_one_or_two_observation": {
258
+ "total": 0.0005407160006143386,
259
  "count": 2,
260
  "is_parallel": true,
261
+ "self": 0.0005407160006143386
262
  }
263
  }
264
  }
 
267
  }
268
  },
269
  "UnityEnvironment.step": {
270
+ "total": 658.3274445931102,
271
+ "count": 118127,
272
  "is_parallel": true,
273
+ "self": 20.83874480905888,
274
  "children": {
275
  "UnityEnvironment._generate_step_input": {
276
+ "total": 43.2128352530126,
277
+ "count": 118127,
278
  "is_parallel": true,
279
+ "self": 43.2128352530126
280
  },
281
  "communicator.exchange": {
282
+ "total": 547.4930454870992,
283
+ "count": 118127,
284
  "is_parallel": true,
285
+ "self": 547.4930454870992
286
  },
287
  "steps_from_proto": {
288
+ "total": 46.782819043939526,
289
+ "count": 118127,
290
  "is_parallel": true,
291
+ "self": 17.487023304808645,
292
  "children": {
293
  "_process_rank_one_or_two_observation": {
294
+ "total": 29.29579573913088,
295
+ "count": 236254,
296
  "is_parallel": true,
297
+ "self": 29.29579573913088
298
  }
299
  }
300
  }
 
307
  }
308
  },
309
  "trainer_advance": {
310
+ "total": 237.05157335112108,
311
+ "count": 118128,
312
+ "self": 3.40058024413338,
313
  "children": {
314
  "process_trajectory": {
315
+ "total": 86.32439864298885,
316
+ "count": 118128,
317
+ "self": 85.67243265498837,
318
  "children": {
319
  "RLTrainer._checkpoint": {
320
+ "total": 0.6519659880004838,
321
+ "count": 5,
322
+ "self": 0.6519659880004838
323
  }
324
  }
325
  },
326
  "_update_policy": {
327
+ "total": 147.32659446399884,
328
+ "count": 48,
329
+ "self": 116.61226426998746,
330
  "children": {
331
  "TorchPPOOptimizer.update": {
332
+ "total": 30.71433019401138,
333
+ "count": 1440,
334
+ "self": 30.71433019401138
335
  }
336
  }
337
  }
 
340
  }
341
  },
342
  "trainer_threads": {
343
+ "total": 1.5639998309779912e-06,
344
  "count": 1,
345
+ "self": 1.5639998309779912e-06
346
  },
347
  "TrainerController._save_models": {
348
+ "total": 0.12841606900019542,
349
  "count": 1,
350
+ "self": 0.0030520170003001112,
351
  "children": {
352
  "RLTrainer._checkpoint": {
353
+ "total": 0.1253640519998953,
354
  "count": 1,
355
+ "self": 0.1253640519998953
356
  }
357
  }
358
  }
run_logs/training_status.json CHANGED
@@ -1,33 +1,6 @@
1
  {
2
  "Huggy": {
3
  "checkpoints": [
4
- {
5
- "steps": 199955,
6
- "file_path": "results/Huggy/Huggy/Huggy-199955.onnx",
7
- "reward": 3.8129177585480707,
8
- "creation_time": 1707226645.5971615,
9
- "auxillary_file_paths": [
10
- "results/Huggy/Huggy/Huggy-199955.pt"
11
- ]
12
- },
13
- {
14
- "steps": 399953,
15
- "file_path": "results/Huggy/Huggy/Huggy-399953.onnx",
16
- "reward": 3.5436155513713232,
17
- "creation_time": 1707226884.371544,
18
- "auxillary_file_paths": [
19
- "results/Huggy/Huggy/Huggy-399953.pt"
20
- ]
21
- },
22
- {
23
- "steps": 599972,
24
- "file_path": "results/Huggy/Huggy/Huggy-599972.onnx",
25
- "reward": 4.225136029092889,
26
- "creation_time": 1707227124.4800828,
27
- "auxillary_file_paths": [
28
- "results/Huggy/Huggy/Huggy-599972.pt"
29
- ]
30
- },
31
  {
32
  "steps": 799987,
33
  "file_path": "results/Huggy/Huggy/Huggy-799987.onnx",
@@ -99,15 +72,78 @@
99
  "auxillary_file_paths": [
100
  "results/Huggy/Huggy/Huggy-2000079.pt"
101
  ]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
102
  }
103
  ],
104
  "final_checkpoint": {
105
- "steps": 2000079,
106
  "file_path": "results/Huggy/Huggy.onnx",
107
- "reward": 4.344622765887867,
108
- "creation_time": 1707228816.7219145,
109
  "auxillary_file_paths": [
110
- "results/Huggy/Huggy/Huggy-2000079.pt"
111
  ]
112
  }
113
  },
 
1
  {
2
  "Huggy": {
3
  "checkpoints": [
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4
  {
5
  "steps": 799987,
6
  "file_path": "results/Huggy/Huggy/Huggy-799987.onnx",
 
72
  "auxillary_file_paths": [
73
  "results/Huggy/Huggy/Huggy-2000079.pt"
74
  ]
75
+ },
76
+ {
77
+ "steps": 2000079,
78
+ "file_path": "results/Huggy/Huggy/Huggy-2000079.onnx",
79
+ "reward": null,
80
+ "creation_time": 1707229532.083456,
81
+ "auxillary_file_paths": [
82
+ "results/Huggy/Huggy/Huggy-2000079.pt"
83
+ ]
84
+ },
85
+ {
86
+ "steps": 2199970,
87
+ "file_path": "results/Huggy/Huggy/Huggy-2199970.onnx",
88
+ "reward": 3.867090335268995,
89
+ "creation_time": 1707229928.373752,
90
+ "auxillary_file_paths": [
91
+ "results/Huggy/Huggy/Huggy-2199970.pt"
92
+ ]
93
+ },
94
+ {
95
+ "steps": 2399874,
96
+ "file_path": "results/Huggy/Huggy/Huggy-2399874.onnx",
97
+ "reward": 4.00003276743106,
98
+ "creation_time": 1707230173.364886,
99
+ "auxillary_file_paths": [
100
+ "results/Huggy/Huggy/Huggy-2399874.pt"
101
+ ]
102
+ },
103
+ {
104
+ "steps": 2599974,
105
+ "file_path": "results/Huggy/Huggy/Huggy-2599974.onnx",
106
+ "reward": 4.05236953496933,
107
+ "creation_time": 1707230418.801743,
108
+ "auxillary_file_paths": [
109
+ "results/Huggy/Huggy/Huggy-2599974.pt"
110
+ ]
111
+ },
112
+ {
113
+ "steps": 2799921,
114
+ "file_path": "results/Huggy/Huggy/Huggy-2799921.onnx",
115
+ "reward": 3.8115060528119407,
116
+ "creation_time": 1707230660.7077575,
117
+ "auxillary_file_paths": [
118
+ "results/Huggy/Huggy/Huggy-2799921.pt"
119
+ ]
120
+ },
121
+ {
122
+ "steps": 2999908,
123
+ "file_path": "results/Huggy/Huggy/Huggy-2999908.onnx",
124
+ "reward": 3.62165554612875,
125
+ "creation_time": 1707230902.9507375,
126
+ "auxillary_file_paths": [
127
+ "results/Huggy/Huggy/Huggy-2999908.pt"
128
+ ]
129
+ },
130
+ {
131
+ "steps": 3000012,
132
+ "file_path": "results/Huggy/Huggy/Huggy-3000012.onnx",
133
+ "reward": 3.630279859052087,
134
+ "creation_time": 1707230903.0828722,
135
+ "auxillary_file_paths": [
136
+ "results/Huggy/Huggy/Huggy-3000012.pt"
137
+ ]
138
  }
139
  ],
140
  "final_checkpoint": {
141
+ "steps": 3000012,
142
  "file_path": "results/Huggy/Huggy.onnx",
143
+ "reward": 3.630279859052087,
144
+ "creation_time": 1707230903.0828722,
145
  "auxillary_file_paths": [
146
+ "results/Huggy/Huggy/Huggy-3000012.pt"
147
  ]
148
  }
149
  },