{
  "act_dim": 6,
  "action_tanh": true,
  "activation_function": "relu",
  "adv_act_dim": 6,
  "architectures": [
    "VanillaDT"
  ],
  "attn_pdrop": 0.1,
  "bos_token_id": 50256,
  "context_size": 20,
  "embd_pdrop": 0.1,
  "eos_token_id": 50256,
  "flag": false,
  "hidden_size": 128,
  "initializer_range": 0.02,
  "lambda1": 1.0,
  "lambda2": 1.0,
  "layer_norm_epsilon": 1e-05,
  "log_interval_steps": 100,
  "max_ep_len": 1000,
  "max_ep_return": 4227,
  "max_obs_len": 1000,
  "max_obs_return": 4227,
  "min_ep_return": -40.860974691808224,
  "min_obs_return": -40.860974691808224,
  "model_type": "decision_transformer",
  "n_head": 1,
  "n_inner": null,
  "n_layer": 3,
  "n_positions": 1024,
  "pr_act_dim": 6,
  "reorder_and_upcast_attn": false,
  "resid_pdrop": 0.1,
  "returns_scale": 1000,
  "scale_attn_by_inverse_layer_idx": false,
  "scale_attn_weights": true,
  "state_dim": 17,
  "state_mean": [
    1.218962501630123,
    0.14163528947484982,
    -0.037049690418079276,
    -0.13816565862287417,
    0.5150924442392095,
    -0.047190008896185874,
    -0.4728192310128083,
    0.04225571020440272,
    2.394827945466415,
    -0.03143244895598562,
    0.04466346992652861,
    -0.023907474073160472,
    -0.10133977389419448,
    0.09091033149985288,
    -0.004192652549242934,
    -0.12120530698001407,
    -0.5496955076793073
  ],
  "state_std": [
    0.12314899816939005,
    0.3243013276243093,
    0.11457279298201731,
    0.26230205605383794,
    0.5641955092260325,
    0.22723931119215887,
    0.383823465370718,
    0.7373887431190398,
    1.23903653745177,
    0.798316986357,
    1.5671374062610388,
    1.8108464431690363,
    3.027126524702137,
    4.064707182931284,
    1.4600719051825006,
    3.7459188910671553,
    5.584324011405262
  ],
  "torch_dtype": "float32",
  "total_train_steps": 10000,
  "transformers_version": "4.31.0",
  "use_cache": true,
  "vocab_size": 1,
  "warmup_steps": 1000
}
|