juan9 committed
Commit aeeccb0
1 Parent(s): f668ff3

First Push

README.md CHANGED
@@ -1,14 +1,14 @@
1
  ---
2
  library_name: ml-agents
3
  tags:
4
- - Pyramids
5
  - deep-reinforcement-learning
6
  - reinforcement-learning
7
- - ML-Agents-Pyramids
8
  ---
9
 
10
- # **ppo** Agent playing **Pyramids**
11
- This is a trained model of a **ppo** agent playing **Pyramids**
12
  using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
13
 
14
  ## Usage (with ML-Agents)
 
1
  ---
2
  library_name: ml-agents
3
  tags:
4
+ - SnowballTarget
5
  - deep-reinforcement-learning
6
  - reinforcement-learning
7
+ - ML-Agents-SnowballTarget
8
  ---
9
 
10
+ # **ppo** Agent playing **SnowballTarget**
11
+ This is a trained model of a **ppo** agent playing **SnowballTarget**
12
  using the [Unity ML-Agents Library](https://github.com/Unity-Technologies/ml-agents).
13
 
14
  ## Usage (with ML-Agents)
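For anyone who wants to poke at the pushed policy outside the ML-Agents toolkit, here is a minimal sketch using ONNX Runtime. The repo id and the exported `.onnx` filename below are assumptions for illustration; neither is shown in this commit.

```python
# Minimal sketch, not the official ML-Agents workflow: download the repo and
# open the exported policy with ONNX Runtime to inspect its inputs/outputs.
from huggingface_hub import snapshot_download  # assumes huggingface_hub is installed
import onnxruntime as ort                      # assumes onnxruntime is installed

local_dir = snapshot_download(repo_id="juan9/ppo-SnowballTarget")   # hypothetical repo id
session = ort.InferenceSession(f"{local_dir}/SnowballTarget.onnx")  # assumed filename

for tensor in session.get_inputs():
    print("input:", tensor.name, tensor.shape)
for tensor in session.get_outputs():
    print("output:", tensor.name, tensor.shape)
```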
config.json CHANGED
@@ -1 +1 @@
1
- {"default_settings": null, "behaviors": {"Pyramids": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.01, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 500000, "network_settings": {"normalize": false, "hidden_units": 512, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}, "rnd": {"gamma": 0.99, "strength": 0.01, "network_settings": {"normalize": false, "hidden_units": 64, "num_layers": 3, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "learning_rate": 0.0001, "encoding_size": null}}, "init_path": null, "keep_checkpoints": 5, "even_checkpoints": false, "max_steps": 1000000, "time_horizon": 128, "summary_freq": 30000, "threaded": false, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/Pyramids/Pyramids", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "Pyramids Training", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
 
1
+ {"default_settings": null, "behaviors": {"SnowballTarget": {"trainer_type": "ppo", "hyperparameters": {"batch_size": 128, "buffer_size": 2048, "learning_rate": 0.0003, "beta": 0.005, "epsilon": 0.2, "lambd": 0.95, "num_epoch": 3, "shared_critic": false, "learning_rate_schedule": "linear", "beta_schedule": "linear", "epsilon_schedule": "linear"}, "checkpoint_interval": 50000, "network_settings": {"normalize": false, "hidden_units": 256, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}, "reward_signals": {"extrinsic": {"gamma": 0.99, "strength": 1.0, "network_settings": {"normalize": false, "hidden_units": 128, "num_layers": 2, "vis_encode_type": "simple", "memory": null, "goal_conditioning_type": "hyper", "deterministic": false}}}, "init_path": null, "keep_checkpoints": 10, "even_checkpoints": false, "max_steps": 200000, "time_horizon": 64, "summary_freq": 10000, "threaded": true, "self_play": null, "behavioral_cloning": null}}, "env_settings": {"env_path": "./training-envs-executables/linux/SnowballTarget/SnowballTarget", "env_args": null, "base_port": 5005, "num_envs": 1, "num_areas": 1, "timeout_wait": 60, "seed": -1, "max_lifetime_restarts": 10, "restarts_rate_limit_n": 1, "restarts_rate_limit_period_s": 60}, "engine_settings": {"width": 84, "height": 84, "quality_level": 5, "time_scale": 20, "target_frame_rate": -1, "capture_frame_rate": 60, "no_graphics": true, "no_graphics_monitor": false}, "environment_parameters": null, "checkpoint_settings": {"run_id": "SnowballTarget1", "initialize_from": null, "load_model": false, "resume": false, "force": false, "train_model": false, "inference": false, "results_dir": "results"}, "torch_settings": {"device": null}, "debug": false}
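config.json captures the fully resolved trainer settings for this run; the same values appear in configuration.yaml below. A minimal sketch, standard library only, for pulling out the PPO hyperparameters:

```python
import json

# Read the resolved trainer configuration committed alongside the model.
with open("config.json") as f:
    cfg = json.load(f)

behavior = cfg["behaviors"]["SnowballTarget"]
print(behavior["trainer_type"])                      # ppo
print(behavior["hyperparameters"]["learning_rate"])  # 0.0003
print(behavior["hyperparameters"]["beta"])           # 0.005
print(behavior["max_steps"])                         # 200000
```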
configuration.yaml CHANGED
@@ -1,12 +1,12 @@
1
  default_settings: null
2
  behaviors:
3
- Pyramids:
4
  trainer_type: ppo
5
  hyperparameters:
6
  batch_size: 128
7
  buffer_size: 2048
8
  learning_rate: 0.0003
9
- beta: 0.01
10
  epsilon: 0.2
11
  lambd: 0.95
12
  num_epoch: 3
@@ -14,10 +14,10 @@ behaviors:
14
  learning_rate_schedule: linear
15
  beta_schedule: linear
16
  epsilon_schedule: linear
17
- checkpoint_interval: 500000
18
  network_settings:
19
  normalize: false
20
- hidden_units: 512
21
  num_layers: 2
22
  vis_encode_type: simple
23
  memory: null
@@ -35,30 +35,17 @@ behaviors:
35
  memory: null
36
  goal_conditioning_type: hyper
37
  deterministic: false
38
- rnd:
39
- gamma: 0.99
40
- strength: 0.01
41
- network_settings:
42
- normalize: false
43
- hidden_units: 64
44
- num_layers: 3
45
- vis_encode_type: simple
46
- memory: null
47
- goal_conditioning_type: hyper
48
- deterministic: false
49
- learning_rate: 0.0001
50
- encoding_size: null
51
  init_path: null
52
- keep_checkpoints: 5
53
  even_checkpoints: false
54
- max_steps: 1000000
55
- time_horizon: 128
56
- summary_freq: 30000
57
- threaded: false
58
  self_play: null
59
  behavioral_cloning: null
60
  env_settings:
61
- env_path: ./training-envs-executables/linux/Pyramids/Pyramids
62
  env_args: null
63
  base_port: 5005
64
  num_envs: 1
@@ -79,7 +66,7 @@ engine_settings:
79
  no_graphics_monitor: false
80
  environment_parameters: null
81
  checkpoint_settings:
82
- run_id: Pyramids Training
83
  initialize_from: null
84
  load_model: false
85
  resume: false
 
1
  default_settings: null
2
  behaviors:
3
+ SnowballTarget:
4
  trainer_type: ppo
5
  hyperparameters:
6
  batch_size: 128
7
  buffer_size: 2048
8
  learning_rate: 0.0003
9
+ beta: 0.005
10
  epsilon: 0.2
11
  lambd: 0.95
12
  num_epoch: 3
 
14
  learning_rate_schedule: linear
15
  beta_schedule: linear
16
  epsilon_schedule: linear
17
+ checkpoint_interval: 50000
18
  network_settings:
19
  normalize: false
20
+ hidden_units: 256
21
  num_layers: 2
22
  vis_encode_type: simple
23
  memory: null
 
35
  memory: null
36
  goal_conditioning_type: hyper
37
  deterministic: false
38
  init_path: null
39
+ keep_checkpoints: 10
40
  even_checkpoints: false
41
+ max_steps: 200000
42
+ time_horizon: 64
43
+ summary_freq: 10000
44
+ threaded: true
45
  self_play: null
46
  behavioral_cloning: null
47
  env_settings:
48
+ env_path: ./training-envs-executables/linux/SnowballTarget/SnowballTarget
49
  env_args: null
50
  base_port: 5005
51
  num_envs: 1
 
66
  no_graphics_monitor: false
67
  environment_parameters: null
68
  checkpoint_settings:
69
+ run_id: SnowballTarget1
70
  initialize_from: null
71
  load_model: false
72
  resume: false
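configuration.yaml is the human-editable training configuration consumed by `mlagents-learn` for this run. A minimal sketch, assuming PyYAML is installed, for checking the run id, environment path, and step budget before re-running or resuming:

```python
import yaml  # PyYAML, assumed installed

with open("configuration.yaml") as f:
    run_cfg = yaml.safe_load(f)

print(run_cfg["checkpoint_settings"]["run_id"])             # SnowballTarget1
print(run_cfg["env_settings"]["env_path"])                  # ./training-envs-executables/linux/SnowballTarget/SnowballTarget
print(run_cfg["behaviors"]["SnowballTarget"]["max_steps"])  # 200000
```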
run_logs/timers.json CHANGED
@@ -1,45 +1,375 @@
1
  {
2
  "name": "root",
3
  "metadata": {
4
  "timer_format_version": "0.1.0",
5
- "start_time_seconds": "1707941582",
6
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
7
- "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
8
  "mlagents_version": "1.1.0.dev0",
9
  "mlagents_envs_version": "1.1.0.dev0",
10
  "communication_protocol_version": "1.5.0",
11
  "pytorch_version": "2.2.0+cu121",
12
  "numpy_version": "1.23.5",
13
- "end_time_seconds": "1707941582"
14
  },
15
- "total": 0.1519914749999316,
16
  "count": 1,
17
- "self": 0.016260902999988502,
18
  "children": {
19
  "run_training.setup": {
20
- "total": 0.07344121500000256,
21
  "count": 1,
22
- "self": 0.07344121500000256
23
  },
24
  "TrainerController.start_learning": {
25
- "total": 0.06228935699994054,
26
  "count": 1,
27
- "self": 0.0007777309999710269,
28
  "children": {
29
  "TrainerController._reset_env": {
30
- "total": 0.06149067399996966,
31
  "count": 1,
32
- "self": 0.06149067399996966
  },
34
  "trainer_threads": {
35
- "total": 1.2639999340535724e-06,
36
  "count": 1,
37
- "self": 1.2639999340535724e-06
38
  },
39
  "TrainerController._save_models": {
40
- "total": 1.9688000065798406e-05,
41
  "count": 1,
42
- "self": 1.9688000065798406e-05
43
  }
44
  }
45
  }
 
1
  {
2
  "name": "root",
3
+ "gauges": {
4
+ "SnowballTarget.Policy.Entropy.mean": {
5
+ "value": 0.9914730787277222,
6
+ "min": 0.9914730787277222,
7
+ "max": 2.873957633972168,
8
+ "count": 20
9
+ },
10
+ "SnowballTarget.Policy.Entropy.sum": {
11
+ "value": 9499.3037109375,
12
+ "min": 9499.3037109375,
13
+ "max": 29495.427734375,
14
+ "count": 20
15
+ },
16
+ "SnowballTarget.Step.mean": {
17
+ "value": 199984.0,
18
+ "min": 9952.0,
19
+ "max": 199984.0,
20
+ "count": 20
21
+ },
22
+ "SnowballTarget.Step.sum": {
23
+ "value": 199984.0,
24
+ "min": 9952.0,
25
+ "max": 199984.0,
26
+ "count": 20
27
+ },
28
+ "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
29
+ "value": 12.96503734588623,
30
+ "min": 0.3656828999519348,
31
+ "max": 12.96503734588623,
32
+ "count": 20
33
+ },
34
+ "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
35
+ "value": 2528.182373046875,
36
+ "min": 70.9424819946289,
37
+ "max": 2602.71875,
38
+ "count": 20
39
+ },
40
+ "SnowballTarget.Environment.EpisodeLength.mean": {
41
+ "value": 199.0,
42
+ "min": 199.0,
43
+ "max": 199.0,
44
+ "count": 20
45
+ },
46
+ "SnowballTarget.Environment.EpisodeLength.sum": {
47
+ "value": 8756.0,
48
+ "min": 8756.0,
49
+ "max": 10945.0,
50
+ "count": 20
51
+ },
52
+ "SnowballTarget.Losses.PolicyLoss.mean": {
53
+ "value": 0.06374345075849253,
54
+ "min": 0.06169963288562476,
55
+ "max": 0.07582122400430415,
56
+ "count": 20
57
+ },
58
+ "SnowballTarget.Losses.PolicyLoss.sum": {
59
+ "value": 0.2549738030339701,
60
+ "min": 0.24679853154249903,
61
+ "max": 0.36523728684508516,
62
+ "count": 20
63
+ },
64
+ "SnowballTarget.Losses.ValueLoss.mean": {
65
+ "value": 0.20116959263881046,
66
+ "min": 0.09848128757256941,
67
+ "max": 0.2898164811525859,
68
+ "count": 20
69
+ },
70
+ "SnowballTarget.Losses.ValueLoss.sum": {
71
+ "value": 0.8046783705552418,
72
+ "min": 0.39392515029027764,
73
+ "max": 1.3678632022119035,
74
+ "count": 20
75
+ },
76
+ "SnowballTarget.Policy.LearningRate.mean": {
77
+ "value": 8.082097306000005e-06,
78
+ "min": 8.082097306000005e-06,
79
+ "max": 0.000291882002706,
80
+ "count": 20
81
+ },
82
+ "SnowballTarget.Policy.LearningRate.sum": {
83
+ "value": 3.232838922400002e-05,
84
+ "min": 3.232838922400002e-05,
85
+ "max": 0.00138516003828,
86
+ "count": 20
87
+ },
88
+ "SnowballTarget.Policy.Epsilon.mean": {
89
+ "value": 0.10269400000000001,
90
+ "min": 0.10269400000000001,
91
+ "max": 0.19729400000000002,
92
+ "count": 20
93
+ },
94
+ "SnowballTarget.Policy.Epsilon.sum": {
95
+ "value": 0.41077600000000003,
96
+ "min": 0.41077600000000003,
97
+ "max": 0.96172,
98
+ "count": 20
99
+ },
100
+ "SnowballTarget.Policy.Beta.mean": {
101
+ "value": 0.0001444306000000001,
102
+ "min": 0.0001444306000000001,
103
+ "max": 0.0048649706,
104
+ "count": 20
105
+ },
106
+ "SnowballTarget.Policy.Beta.sum": {
107
+ "value": 0.0005777224000000004,
108
+ "min": 0.0005777224000000004,
109
+ "max": 0.023089828,
110
+ "count": 20
111
+ },
112
+ "SnowballTarget.Environment.CumulativeReward.mean": {
113
+ "value": 25.886363636363637,
114
+ "min": 2.8636363636363638,
115
+ "max": 25.886363636363637,
116
+ "count": 20
117
+ },
118
+ "SnowballTarget.Environment.CumulativeReward.sum": {
119
+ "value": 1139.0,
120
+ "min": 126.0,
121
+ "max": 1393.0,
122
+ "count": 20
123
+ },
124
+ "SnowballTarget.Policy.ExtrinsicReward.mean": {
125
+ "value": 25.886363636363637,
126
+ "min": 2.8636363636363638,
127
+ "max": 25.886363636363637,
128
+ "count": 20
129
+ },
130
+ "SnowballTarget.Policy.ExtrinsicReward.sum": {
131
+ "value": 1139.0,
132
+ "min": 126.0,
133
+ "max": 1393.0,
134
+ "count": 20
135
+ },
136
+ "SnowballTarget.IsTraining.mean": {
137
+ "value": 1.0,
138
+ "min": 1.0,
139
+ "max": 1.0,
140
+ "count": 20
141
+ },
142
+ "SnowballTarget.IsTraining.sum": {
143
+ "value": 1.0,
144
+ "min": 1.0,
145
+ "max": 1.0,
146
+ "count": 20
147
+ }
148
+ },
149
  "metadata": {
150
  "timer_format_version": "0.1.0",
151
+ "start_time_seconds": "1707941657",
152
  "python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
153
+ "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics",
154
  "mlagents_version": "1.1.0.dev0",
155
  "mlagents_envs_version": "1.1.0.dev0",
156
  "communication_protocol_version": "1.5.0",
157
  "pytorch_version": "2.2.0+cu121",
158
  "numpy_version": "1.23.5",
159
+ "end_time_seconds": "1707942274"
160
  },
161
+ "total": 616.9848276049999,
162
  "count": 1,
163
+ "self": 0.5305121579997376,
164
  "children": {
165
  "run_training.setup": {
166
+ "total": 0.07121669399998609,
167
  "count": 1,
168
+ "self": 0.07121669399998609
169
  },
170
  "TrainerController.start_learning": {
171
+ "total": 616.3830987530001,
172
  "count": 1,
173
+ "self": 0.9253966029928051,
174
  "children": {
175
  "TrainerController._reset_env": {
176
+ "total": 4.86483831399994,
177
  "count": 1,
178
+ "self": 4.86483831399994
179
+ },
180
+ "TrainerController.advance": {
181
+ "total": 610.4914103100073,
182
+ "count": 18203,
183
+ "self": 0.44134618003295145,
184
+ "children": {
185
+ "env_step": {
186
+ "total": 610.0500641299743,
187
+ "count": 18203,
188
+ "self": 469.4286792179771,
189
+ "children": {
190
+ "SubprocessEnvManager._take_step": {
191
+ "total": 140.18064394098474,
192
+ "count": 18203,
193
+ "self": 2.7716976129713657,
194
+ "children": {
195
+ "TorchPolicy.evaluate": {
196
+ "total": 137.40894632801337,
197
+ "count": 18203,
198
+ "self": 137.40894632801337
199
+ }
200
+ }
201
+ },
202
+ "workers": {
203
+ "total": 0.4407409710124739,
204
+ "count": 18203,
205
+ "self": 0.0,
206
+ "children": {
207
+ "worker_root": {
208
+ "total": 614.3191371800239,
209
+ "count": 18203,
210
+ "is_parallel": true,
211
+ "self": 289.1690472830177,
212
+ "children": {
213
+ "run_training.setup": {
214
+ "total": 0.0,
215
+ "count": 0,
216
+ "is_parallel": true,
217
+ "self": 0.0,
218
+ "children": {
219
+ "steps_from_proto": {
220
+ "total": 0.007789372000047479,
221
+ "count": 1,
222
+ "is_parallel": true,
223
+ "self": 0.0055618820002791836,
224
+ "children": {
225
+ "_process_rank_one_or_two_observation": {
226
+ "total": 0.002227489999768295,
227
+ "count": 10,
228
+ "is_parallel": true,
229
+ "self": 0.002227489999768295
230
+ }
231
+ }
232
+ },
233
+ "UnityEnvironment.step": {
234
+ "total": 0.05753250100008245,
235
+ "count": 1,
236
+ "is_parallel": true,
237
+ "self": 0.0026428850000002058,
238
+ "children": {
239
+ "UnityEnvironment._generate_step_input": {
240
+ "total": 0.0005031310000731537,
241
+ "count": 1,
242
+ "is_parallel": true,
243
+ "self": 0.0005031310000731537
244
+ },
245
+ "communicator.exchange": {
246
+ "total": 0.04731931200001327,
247
+ "count": 1,
248
+ "is_parallel": true,
249
+ "self": 0.04731931200001327
250
+ },
251
+ "steps_from_proto": {
252
+ "total": 0.007067172999995819,
253
+ "count": 1,
254
+ "is_parallel": true,
255
+ "self": 0.0005673890000252868,
256
+ "children": {
257
+ "_process_rank_one_or_two_observation": {
258
+ "total": 0.006499783999970532,
259
+ "count": 10,
260
+ "is_parallel": true,
261
+ "self": 0.006499783999970532
262
+ }
263
+ }
264
+ }
265
+ }
266
+ }
267
+ }
268
+ },
269
+ "UnityEnvironment.step": {
270
+ "total": 325.1500898970062,
271
+ "count": 18202,
272
+ "is_parallel": true,
273
+ "self": 15.278682513998433,
274
+ "children": {
275
+ "UnityEnvironment._generate_step_input": {
276
+ "total": 7.886213973984923,
277
+ "count": 18202,
278
+ "is_parallel": true,
279
+ "self": 7.886213973984923
280
+ },
281
+ "communicator.exchange": {
282
+ "total": 255.72345804001293,
283
+ "count": 18202,
284
+ "is_parallel": true,
285
+ "self": 255.72345804001293
286
+ },
287
+ "steps_from_proto": {
288
+ "total": 46.2617353690099,
289
+ "count": 18202,
290
+ "is_parallel": true,
291
+ "self": 9.199899673961909,
292
+ "children": {
293
+ "_process_rank_one_or_two_observation": {
294
+ "total": 37.06183569504799,
295
+ "count": 182020,
296
+ "is_parallel": true,
297
+ "self": 37.06183569504799
298
+ }
299
+ }
300
+ }
301
+ }
302
+ }
303
+ }
304
+ }
305
+ }
306
+ }
307
+ }
308
+ }
309
+ }
310
  },
311
  "trainer_threads": {
312
+ "total": 0.00013422500001070148,
313
  "count": 1,
314
+ "self": 0.00013422500001070148,
315
+ "children": {
316
+ "thread_root": {
317
+ "total": 0.0,
318
+ "count": 0,
319
+ "is_parallel": true,
320
+ "self": 0.0,
321
+ "children": {
322
+ "trainer_advance": {
323
+ "total": 603.3576001671316,
324
+ "count": 787096,
325
+ "is_parallel": true,
326
+ "self": 18.87754923110151,
327
+ "children": {
328
+ "process_trajectory": {
329
+ "total": 321.9403706180301,
330
+ "count": 787096,
331
+ "is_parallel": true,
332
+ "self": 321.37840758902985,
333
+ "children": {
334
+ "RLTrainer._checkpoint": {
335
+ "total": 0.5619630290002533,
336
+ "count": 4,
337
+ "is_parallel": true,
338
+ "self": 0.5619630290002533
339
+ }
340
+ }
341
+ },
342
+ "_update_policy": {
343
+ "total": 262.539680318,
344
+ "count": 90,
345
+ "is_parallel": true,
346
+ "self": 68.92569046499761,
347
+ "children": {
348
+ "TorchPPOOptimizer.update": {
349
+ "total": 193.6139898530024,
350
+ "count": 4587,
351
+ "is_parallel": true,
352
+ "self": 193.6139898530024
353
+ }
354
+ }
355
+ }
356
+ }
357
+ }
358
+ }
359
+ }
360
+ }
361
  },
362
  "TrainerController._save_models": {
363
+ "total": 0.10131930100010322,
364
  "count": 1,
365
+ "self": 0.0012558180001178698,
366
+ "children": {
367
+ "RLTrainer._checkpoint": {
368
+ "total": 0.10006348299998535,
369
+ "count": 1,
370
+ "self": 0.10006348299998535
371
+ }
372
+ }
373
  }
374
  }
375
  }
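run_logs/timers.json is a nested profiling tree: every timer node records total seconds, call count, self time, and children, and the root additionally carries a gauges block of training metrics. A minimal sketch for walking the tree and seeing where the roughly 617 s of wall-clock time recorded for this run went:

```python
import json

def walk(node, name="root", depth=0):
    """Recursively print each timer's total seconds and call count."""
    total = node.get("total", 0.0)
    count = node.get("count", 0)
    print(f"{'  ' * depth}{name}: {total:.1f}s over {count} call(s)")
    for child_name, child in node.get("children", {}).items():
        walk(child, child_name, depth + 1)

with open("run_logs/timers.json") as f:
    walk(json.load(f))
```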
run_logs/training_status.json CHANGED
@@ -1,4 +1,62 @@
1
  {
2
  "metadata": {
3
  "stats_format_version": "0.3.0",
4
  "mlagents_version": "1.1.0.dev0",
 
1
  {
2
+ "SnowballTarget": {
3
+ "checkpoints": [
4
+ {
5
+ "steps": 49936,
6
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.onnx",
7
+ "reward": 12.545454545454545,
8
+ "creation_time": 1707941813.3585904,
9
+ "auxillary_file_paths": [
10
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-49936.pt"
11
+ ]
12
+ },
13
+ {
14
+ "steps": 99960,
15
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.onnx",
16
+ "reward": 20.272727272727273,
17
+ "creation_time": 1707941968.323758,
18
+ "auxillary_file_paths": [
19
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-99960.pt"
20
+ ]
21
+ },
22
+ {
23
+ "steps": 149984,
24
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.onnx",
25
+ "reward": 24.727272727272727,
26
+ "creation_time": 1707942119.6343586,
27
+ "auxillary_file_paths": [
28
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-149984.pt"
29
+ ]
30
+ },
31
+ {
32
+ "steps": 199984,
33
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx",
34
+ "reward": 25.272727272727273,
35
+ "creation_time": 1707942273.4143367,
36
+ "auxillary_file_paths": [
37
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.pt"
38
+ ]
39
+ },
40
+ {
41
+ "steps": 200112,
42
+ "file_path": "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.onnx",
43
+ "reward": 25.272727272727273,
44
+ "creation_time": 1707942273.5439253,
45
+ "auxillary_file_paths": [
46
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
47
+ ]
48
+ }
49
+ ],
50
+ "final_checkpoint": {
51
+ "steps": 200112,
52
+ "file_path": "results/SnowballTarget1/SnowballTarget.onnx",
53
+ "reward": 25.272727272727273,
54
+ "creation_time": 1707942273.5439253,
55
+ "auxillary_file_paths": [
56
+ "results/SnowballTarget1/SnowballTarget/SnowballTarget-200112.pt"
57
+ ]
58
+ }
59
+ },
60
  "metadata": {
61
  "stats_format_version": "0.3.0",
62
  "mlagents_version": "1.1.0.dev0",
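run_logs/training_status.json records each saved checkpoint with its step count, mean reward, and file path. A minimal sketch for selecting the highest-reward checkpoint from this log:

```python
import json

with open("run_logs/training_status.json") as f:
    status = json.load(f)

checkpoints = status["SnowballTarget"]["checkpoints"]
best = max(checkpoints, key=lambda c: c["reward"])
print(best["steps"], best["reward"], best["file_path"])
# -> 199984 25.272727272727273 results/SnowballTarget1/SnowballTarget/SnowballTarget-199984.onnx
```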