Kano001 committed on
Commit
fbb2a8b
1 Parent(s): 0bec4af

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +86 -0
README.md CHANGED
@@ -4,4 +4,90 @@ tags:
4
  - deep-reinforcement-learning
5
  - reinforcement-learning
6
  - ml-agents
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7
  ---
 
4
  - deep-reinforcement-learning
5
  - reinforcement-learning
6
  - ml-agents
7
+
8
+ environment:
9
+ - CollectCoin
10
+
11
+
12
+ ---
13
+
14
+ # Collect Coin, an environment for ML-Agents made by Brijesh Tejani
15
+
16
+ ### Config File
17
+ `behaviors:
18
+ CollectCoin:
19
+ trainer_type: ppo
20
+ hyperparameters:
21
+ batch_size: 1024
22
+ buffer_size: 10240
23
+ learning_rate: 0.0003
24
+ beta: 0.005
25
+ epsilon: 0.2
26
+ lambd: 0.95
27
+ num_epoch: 3
28
+ shared_critic: false
29
+ learning_rate_schedule: linear
30
+ beta_schedule: linear
31
+ epsilon_schedule: linear
32
+ network_settings:
33
+ normalize: false
34
+ hidden_units: 128
35
+ num_layers: 2
36
+ vis_encode_type: simple
37
+ memory: null
38
+ goal_conditioning_type: hyper
39
+ deterministic: false
40
+ reward_signals:
41
+ extrinsic:
42
+ gamma: 0.99
43
+ strength: 1.0
44
+ network_settings:
45
+ normalize: false
46
+ hidden_units: 128
47
+ num_layers: 2
48
+ vis_encode_type: simple
49
+ memory: null
50
+ goal_conditioning_type: hyper
51
+ deterministic: false
52
+ init_path: null
53
+ keep_checkpoints: 5
54
+ checkpoint_interval: 500000
55
+ max_steps: 2500000
56
+ time_horizon: 64
57
+ summary_freq: 50000
58
+ threaded: false
59
+ self_play: null
60
+ behavioral_cloning: null
61
+ env_settings:
62
+ env_path: null
63
+ env_args: null
64
+ base_port: 5005
65
+ num_envs: 1
66
+ num_areas: 1
67
+ seed: -1
68
+ max_lifetime_restarts: 10
69
+ restarts_rate_limit_n: 1
70
+ restarts_rate_limit_period_s: 60
71
+ engine_settings:
72
+ width: 84
73
+ height: 84
74
+ quality_level: 5
75
+ time_scale: 20
76
+ target_frame_rate: -1
77
+ capture_frame_rate: 60
78
+ no_graphics: false
79
+ environment_parameters: null
80
+ checkpoint_settings:
81
+ run_id: '001'
82
+ initialize_from: null
83
+ load_model: false
84
+ resume: false
85
+ force: false
86
+ train_model: false
87
+ inference: false
88
+ results_dir: results
89
+ torch_settings:
90
+ device: null
91
+ debug: false
92
+ `
93
  ---