ahalev committed on
Commit
caf33a8
1 Parent(s): 5a2060e

Upload config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.yaml +164 -0
config.yaml ADDED
@@ -0,0 +1,164 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ algo:
2
+ ddpg:
3
+ params:
4
+ target_update_tau: 0.01
5
+ policy:
6
+ exploration:
7
+ sigma: 0.3
8
+ theta: 0.15
9
+ deterministic_params:
10
+ buffer_batch_size: 32
11
+ min_buffer_size: 10000
12
+ n_train_steps: 500
13
+ qf_lr: 0.0001
14
+ steps_per_epoch: 1
15
+ dqn:
16
+ params:
17
+ clip_gradient: 10
18
+ deterministic_eval: true
19
+ double_q: false
20
+ target_update_freq: 2
21
+ policy:
22
+ exploration:
23
+ decay_ratio: 0.5
24
+ max_epsilon: 1.0
25
+ min_epsilon: 0.05
26
+ general_params:
27
+ discount: 0.99
28
+ package: garage
29
+ policy:
30
+ hidden_sizes:
31
+ - 128
32
+ - 128
33
+ pretrained_policy: null
34
+ ppo:
35
+ params:
36
+ center_adv: false
37
+ num_train_per_epoch: 1
38
+ tanhnormal: false
39
+ pretrain:
40
+ additional_config: null
41
+ algo_to_pretrain: null
42
+ params:
43
+ episodes_per_batch: 10
44
+ loss: log_prob
45
+ policy_lr: 0.01
46
+ pretrain_algo: rbc
47
+ replay_buffer:
48
+ buffer_size: 200000
49
+ rnd:
50
+ batch_size: 64
51
+ bound_reward_weight: cosine
52
+ bound_reward_weight_initial_ratio: 0.999999
53
+ bound_reward_weight_transient_epochs: 10
54
+ hidden_sizes:
55
+ - 64
56
+ - 64
57
+ intrinsic_reward_weight: 0.0001
58
+ n_train_steps: 32
59
+ output_dim: 128
60
+ predictor_lr: 0.001
61
+ standardize_extrinsic_reward: true
62
+ standardize_intrinsic_reward: true
63
+ sampler:
64
+ n_workers: 16
65
+ type: ray
66
+ train:
67
+ batch_size: 50000
68
+ gpu_id: 0
69
+ n_epochs: 100
70
+ steps_per_epoch: 32
71
+ use_gpu: false
72
+ type: ppo
73
+ context:
74
+ disable_logging: false
75
+ experiment_name: null
76
+ log_dir:
77
+ from_keys:
78
+ - microgrid.config.scenario
79
+ - microgrid.methods.set_forecaster.forecaster
80
+ - microgrid.methods.set_module_attrs.battery_transition_model
81
+ - context.seed
82
+ - env.domain_randomization.noise_std
83
+ - algo.ppo.tanhnormal
84
+ - algo.rnd.intrinsic_reward_weight
85
+ parent: /home/ahalev/data/GridRL/paper_experiments
86
+ use_existing_dir: false
87
+ seed: 42
88
+ snapshot_gap: 10
89
+ verbose: 0
90
+ wandb:
91
+ api_key_file: ../../local/wandb_api_key.txt
92
+ group: null
93
+ log_density: 1
94
+ plot_baseline:
95
+ - mpc
96
+ - rbc
97
+ username: ahalev
98
+ env:
99
+ cls: DiscreteMicrogridEnv
100
+ domain_randomization:
101
+ noise_std: 0.01
102
+ relative_noise: true
103
+ forced_genset: null
104
+ net_load:
105
+ slack_module: grid
106
+ use: true
107
+ observation_keys:
108
+ - soc
109
+ - net_load
110
+ - import_price_current
111
+ - import_price_forecast_0
112
+ - import_price_forecast_1
113
+ - import_price_forecast_2
114
+ - import_price_forecast_3
115
+ - import_price_forecast_4
116
+ - import_price_forecast_5
117
+ - import_price_forecast_6
118
+ - import_price_forecast_7
119
+ - import_price_forecast_8
120
+ - import_price_forecast_9
121
+ - import_price_forecast_10
122
+ - import_price_forecast_11
123
+ - import_price_forecast_12
124
+ - import_price_forecast_13
125
+ - import_price_forecast_14
126
+ - import_price_forecast_15
127
+ - import_price_forecast_16
128
+ - import_price_forecast_17
129
+ - import_price_forecast_18
130
+ - import_price_forecast_19
131
+ - import_price_forecast_20
132
+ - import_price_forecast_21
133
+ - import_price_forecast_22
134
+ microgrid:
135
+ attributes:
136
+ reward_shaping_func: !BaselineShaper
137
+ baseline_module: false
138
+ module:
139
+ - grid
140
+ - 0
141
+ config:
142
+ scenario: 4
143
+ methods:
144
+ set_forecaster:
145
+ forecast_horizon: 23
146
+ forecaster: 0.0
147
+ forecaster_increase_uncertainty: true
148
+ forecaster_relative_noise: true
149
+ set_module_attrs:
150
+ battery_transition_model: null
151
+ normalized_action_bounds:
152
+ - 0.0
153
+ - 1.0
154
+ trajectory:
155
+ evaluate:
156
+ final_step: -1
157
+ initial_step: 5840
158
+ trajectory_func: null
159
+ train:
160
+ final_step: 5840
161
+ initial_step: 0
162
+ trajectory_func: !FixedLengthStochasticTrajectory
163
+ trajectory_length: 720
164
+ verbose: 1