afonsosamarques's picture
Training in progress, step 3334
8a4fc46
{
"act_dim": 6,
"action_tanh": true,
"activation_function": "relu",
"adv_act_dim": 6,
"architectures": [
"VanillaDT"
],
"attn_pdrop": 0.1,
"bos_token_id": 50256,
"context_size": 20,
"embd_pdrop": 0.1,
"eos_token_id": 50256,
"flag": false,
"hidden_size": 128,
"initializer_range": 0.02,
"lambda1": 1.0,
"lambda2": 1.0,
"layer_norm_epsilon": 1e-05,
"log_interval_steps": 100,
"max_ep_len": 1000,
"max_ep_return": 4227,
"max_obs_len": 1000,
"max_obs_return": 4227,
"min_ep_return": -40.860974691808224,
"min_obs_return": -40.860974691808224,
"model_type": "decision_transformer",
"n_head": 1,
"n_inner": null,
"n_layer": 3,
"n_positions": 1024,
"pr_act_dim": 6,
"reorder_and_upcast_attn": false,
"resid_pdrop": 0.1,
"returns_scale": 1000,
"scale_attn_by_inverse_layer_idx": false,
"scale_attn_weights": true,
"state_dim": 17,
"state_mean": [
1.218962501630123,
0.14163528947484982,
-0.037049690418079276,
-0.13816565862287417,
0.5150924442392095,
-0.047190008896185874,
-0.4728192310128083,
0.04225571020440272,
2.394827945466415,
-0.03143244895598562,
0.04466346992652861,
-0.023907474073160472,
-0.10133977389419448,
0.09091033149985288,
-0.004192652549242934,
-0.12120530698001407,
-0.5496955076793073
],
"state_std": [
0.12314899816939005,
0.3243013276243093,
0.11457279298201731,
0.26230205605383794,
0.5641955092260325,
0.22723931119215887,
0.383823465370718,
0.7373887431190398,
1.23903653745177,
0.798316986357,
1.5671374062610388,
1.8108464431690363,
3.027126524702137,
4.064707182931284,
1.4600719051825006,
3.7459188910671553,
5.584324011405262
],
"torch_dtype": "float32",
"total_train_steps": 10000,
"transformers_version": "4.31.0",
"use_cache": true,
"vocab_size": 1,
"warmup_steps": 1000
}