alexandersoare commited on
Commit
2d132c1
1 Parent(s): c7f4e49

Upload folder using huggingface_hub

Browse files
pretrained_model/README.md ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PytorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Library: [More Information Needed]
9
+ - Docs: [More Information Needed]
pretrained_model/config.json ADDED
@@ -0,0 +1,50 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "advantage_scaling": 3.0,
3
+ "cem_iterations": 6,
4
+ "consistency_coeff": 20.0,
5
+ "discount": 0.98,
6
+ "elite_weighting_temperature": 0.5,
7
+ "expectile_weight": 0.9,
8
+ "gaussian_mean_momentum": 0.1,
9
+ "horizon": 5,
10
+ "image_encoder_hidden_dim": 32,
11
+ "input_normalization_modes": {
12
+ "observation.environment_state": "min_max",
13
+ "observation.state": "min_max"
14
+ },
15
+ "input_shapes": {
16
+ "observation.environment_state": [
17
+ 16
18
+ ],
19
+ "observation.state": [
20
+ 2
21
+ ]
22
+ },
23
+ "latent_dim": 50,
24
+ "max_random_shift_ratio": 0.0476,
25
+ "max_std": 2.0,
26
+ "min_std": 0.05,
27
+ "mlp_dim": 512,
28
+ "n_action_repeats": 1,
29
+ "n_action_steps": 5,
30
+ "n_elites": 50,
31
+ "n_gaussian_samples": 512,
32
+ "n_pi_samples": 51,
33
+ "output_normalization_modes": {
34
+ "action": "min_max"
35
+ },
36
+ "output_shapes": {
37
+ "action": [
38
+ 2
39
+ ]
40
+ },
41
+ "pi_coeff": 0.5,
42
+ "q_ensemble_size": 5,
43
+ "reward_coeff": 0.5,
44
+ "state_encoder_hidden_dim": 256,
45
+ "target_model_momentum": 0.995,
46
+ "temporal_decay_coeff": 0.5,
47
+ "uncertainty_regularizer_coeff": 1.0,
48
+ "use_mpc": true,
49
+ "value_coeff": 0.1
50
+ }
pretrained_model/config.yaml ADDED
@@ -0,0 +1,148 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ resume: false
2
+ device: cuda
3
+ use_amp: true
4
+ seed: 1
5
+ dataset_repo_id: lerobot/pusht_keypoints
6
+ video_backend: pyav
7
+ training:
8
+ offline_steps: 0
9
+ num_workers: 12
10
+ batch_size: 256
11
+ eval_freq: 10000
12
+ log_freq: 250
13
+ save_checkpoint: true
14
+ save_freq: 10000
15
+ online_steps: 1000000
16
+ online_steps_between_rollouts: 1000
17
+ online_rollout_n_episodes: 10
18
+ online_rollout_batch_size: 10
19
+ online_sampling_ratio: 1.0
20
+ online_env_seed: 10000
21
+ online_buffer_capacity: 40000
22
+ online_buffer_seed_size: 0
23
+ do_online_rollout_async: false
24
+ image_transforms:
25
+ enable: false
26
+ max_num_transforms: 3
27
+ random_order: false
28
+ brightness:
29
+ weight: 1
30
+ min_max:
31
+ - 0.8
32
+ - 1.2
33
+ contrast:
34
+ weight: 1
35
+ min_max:
36
+ - 0.8
37
+ - 1.2
38
+ saturation:
39
+ weight: 1
40
+ min_max:
41
+ - 0.5
42
+ - 1.5
43
+ hue:
44
+ weight: 1
45
+ min_max:
46
+ - -0.05
47
+ - 0.05
48
+ sharpness:
49
+ weight: 1
50
+ min_max:
51
+ - 0.8
52
+ - 1.2
53
+ grad_clip_norm: 10.0
54
+ lr: 0.0003
55
+ delta_timestamps:
56
+ observation.environment_state:
57
+ - 0.0
58
+ - 0.1
59
+ - 0.2
60
+ - 0.3
61
+ - 0.4
62
+ - 0.5
63
+ observation.state:
64
+ - 0.0
65
+ - 0.1
66
+ - 0.2
67
+ - 0.3
68
+ - 0.4
69
+ - 0.5
70
+ action:
71
+ - 0.0
72
+ - 0.1
73
+ - 0.2
74
+ - 0.3
75
+ - 0.4
76
+ next.reward:
77
+ - 0.0
78
+ - 0.1
79
+ - 0.2
80
+ - 0.3
81
+ - 0.4
82
+ eval:
83
+ n_episodes: 50
84
+ batch_size: 50
85
+ use_async_envs: true
86
+ wandb:
87
+ enable: true
88
+ disable_artifact: true
89
+ project: lerobot
90
+ notes: ''
91
+ fps: 10
92
+ env:
93
+ name: pusht
94
+ task: PushT-v0
95
+ image_size: 96
96
+ state_dim: 2
97
+ action_dim: 2
98
+ fps: ${fps}
99
+ episode_length: 300
100
+ gym:
101
+ obs_type: environment_state_agent_pos
102
+ render_mode: rgb_array
103
+ visualization_width: 384
104
+ visualization_height: 384
105
+ policy:
106
+ name: tdmpc
107
+ pretrained_model_path: null
108
+ n_action_repeats: 1
109
+ horizon: 5
110
+ n_action_steps: 5
111
+ input_shapes:
112
+ observation.environment_state:
113
+ - 16
114
+ observation.state:
115
+ - ${env.state_dim}
116
+ output_shapes:
117
+ action:
118
+ - ${env.action_dim}
119
+ input_normalization_modes:
120
+ observation.environment_state: min_max
121
+ observation.state: min_max
122
+ output_normalization_modes:
123
+ action: min_max
124
+ image_encoder_hidden_dim: 32
125
+ state_encoder_hidden_dim: 256
126
+ latent_dim: 50
127
+ q_ensemble_size: 5
128
+ mlp_dim: 512
129
+ discount: 0.98
130
+ use_mpc: true
131
+ cem_iterations: 6
132
+ max_std: 2.0
133
+ min_std: 0.05
134
+ n_gaussian_samples: 512
135
+ n_pi_samples: 51
136
+ uncertainty_regularizer_coeff: 1.0
137
+ n_elites: 50
138
+ elite_weighting_temperature: 0.5
139
+ gaussian_mean_momentum: 0.1
140
+ max_random_shift_ratio: 0.0476
141
+ reward_coeff: 0.5
142
+ expectile_weight: 0.9
143
+ value_coeff: 0.1
144
+ consistency_coeff: 20.0
145
+ advantage_scaling: 3.0
146
+ pi_coeff: 0.5
147
+ temporal_decay_coeff: 0.5
148
+ target_model_momentum: 0.995
pretrained_model/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c04290f1a030bb8a1441ccc343e4565e3a8f9cb6ca3ee3537042631a6e9cabf6
3
+ size 21456272
training_state.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a7913780b6fc3db69ab3ed33550306225e22353e84c3ea088dd3ebe30106be99
3
+ size 21529788