Bbyaz commited on
Commit
72ace65
1 Parent(s): fd1906f

Grasping model for table clearing depth input (#1)

Browse files

- model: table clearing grasping model (ae179daf3743edb4789c3b9c1b98d922a2966279)

SAC_1m_table_clearing/SAC_10m_table.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7dea64249ea4816a88eac6f6c738550dc79aefa3fb07cb999ef2a67e07f0ac5e
3
+ size 8051409
SAC_1m_table_clearing/best_model/best_model.zip ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f50ee824ce420c3c48df193ee8bc5a9de127feaadc2655281c4c017b754ace4e
3
+ size 8051409
SAC_1m_table_clearing/best_model/config.yaml ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ BDQ:
2
+ batch_size: 64
3
+ buffer_size: 1000000
4
+ epsilon_greedy: true
5
+ exploration_final_eps: 0.1
6
+ exploration_fraction: 0.3
7
+ layers:
8
+ - [64, 64]
9
+ - [32]
10
+ - [32]
11
+ learning_rate: 0.0001
12
+ learning_starts: 1000
13
+ num_actions_pad: 33
14
+ prioritized_replay: false
15
+ save_dir: BDQ1mSimplified
16
+ target_network_update_freq: 1000
17
+ tensorboard_logs: null
18
+ total_timesteps: 4000000
19
+ DDPG: {save_dir: DDPG, tensorboard_logs: DDPG, total_timesteps: 2000000}
20
+ DQN: {batch_size: 32, learning_rate: 0.001, prioritized_replay: true, save_dir: DQN4mFull,
21
+ tensorboard_logs: null, total_timesteps: 4000000}
22
+ PPO: {learning_rate: 0.001, n_steps: 2000, save_dir: ppo_5m, tensorboard_logs: tensorboard_logs/ppo_5m,
23
+ total_timesteps: 1000000}
24
+ SAC:
25
+ batch_size: 64
26
+ buffer_size: 1000000
27
+ layers: [64, 64]
28
+ max_iters: 400
29
+ save_dir: SAC_10m_table
30
+ step_size: 0.0003
31
+ tensorboard_logs: null
32
+ total_timesteps: 10000000
33
+ TRPO: {batch_size: 64, max_iters: 400, save_dir: trpo_1m, step_size: 0.001, tensorboard_logs: tensorboard_logs/trpo_1m,
34
+ total_timesteps: 5000000}
35
+ algorithm: sac
36
+ curriculum:
37
+ extent: [0.01, 0.1]
38
+ init_lambda: 0.0
39
+ lift_dist: [0.015, 0.1]
40
+ max_objects: [1, 5]
41
+ min_objects: [1, 1]
42
+ n_steps: 8
43
+ robot_height: [0.15, 0.25]
44
+ success_threshold: 0.7
45
+ window_size: 1000
46
+ depth_observation: true
47
+ discount_factor: 0.99
48
+ full_observation: false
49
+ normalize: true
50
+ reward: {custom: true, delta_z_scale: 1000.0, grasp_reward: 100.0, shaped: true, terminal_reward: 10000.0,
51
+ time_penalty: 200.0, table_clearing: True}
52
+ robot: {discrete: false, max_force: 100, max_translation: 0.05, max_yaw_rotation: 0.20,
53
+ model_path: models/gripper/wsg50_one_motor_gripper_new.sdf, num_actions_pad: 2,
54
+ step_size: 0.01, yaw_step: 0.1}
55
+ scene: {data_set: random_urdfs, scene_type: OnTable}
56
+ sensor:
57
+ camera_info: config/camera_info.yaml
58
+ encoder_dir: encoder_files/new_gripper_encoder
59
+ randomize: {focal_length: 4, optical_center: 2, rotation: 0.0349, translation: 0.002}
60
+ transform: config/camera_transform.yaml
61
+ visualize: false
62
+ simplified: false
63
+ simulation: {real_time: false, visualize: false}
64
+ skip_empty_initial_state: true
65
+ time_horizon: 200
SAC_1m_table_clearing/best_model/logs/evaluations.npz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b929cacf83bdc30ff352918ee9b6956e2611ddf2d536b4abeea376ce7f8f669d
3
+ size 26370
SAC_1m_table_clearing/best_model/vecnormalize.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bb993568ad3fe89117e99cb52cd4bf904ac1c97f57c94cc13271a6937012d5b7
3
+ size 252579
SAC_1m_table_clearing/config.yaml ADDED
@@ -0,0 +1,65 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ BDQ:
2
+ batch_size: 64
3
+ buffer_size: 1000000
4
+ epsilon_greedy: true
5
+ exploration_final_eps: 0.1
6
+ exploration_fraction: 0.3
7
+ layers:
8
+ - [64, 64]
9
+ - [32]
10
+ - [32]
11
+ learning_rate: 0.0001
12
+ learning_starts: 1000
13
+ num_actions_pad: 33
14
+ prioritized_replay: false
15
+ save_dir: BDQ1mSimplified
16
+ target_network_update_freq: 1000
17
+ tensorboard_logs: null
18
+ total_timesteps: 4000000
19
+ DDPG: {save_dir: DDPG, tensorboard_logs: DDPG, total_timesteps: 2000000}
20
+ DQN: {batch_size: 32, learning_rate: 0.001, prioritized_replay: true, save_dir: DQN4mFull,
21
+ tensorboard_logs: null, total_timesteps: 4000000}
22
+ PPO: {learning_rate: 0.001, n_steps: 2000, save_dir: ppo_5m, tensorboard_logs: tensorboard_logs/ppo_5m,
23
+ total_timesteps: 1000000}
24
+ SAC:
25
+ batch_size: 64
26
+ buffer_size: 1000000
27
+ layers: [64, 64]
28
+ max_iters: 400
29
+ save_dir: SAC_10m_table
30
+ step_size: 0.0003
31
+ tensorboard_logs: null
32
+ total_timesteps: 10000000
33
+ TRPO: {batch_size: 64, max_iters: 400, save_dir: trpo_1m, step_size: 0.001, tensorboard_logs: tensorboard_logs/trpo_1m,
34
+ total_timesteps: 5000000}
35
+ algorithm: sac
36
+ curriculum:
37
+ extent: [0.01, 0.1]
38
+ init_lambda: 0.0
39
+ lift_dist: [0.015, 0.1]
40
+ max_objects: [1, 5]
41
+ min_objects: [1, 1]
42
+ n_steps: 8
43
+ robot_height: [0.15, 0.25]
44
+ success_threshold: 0.7
45
+ window_size: 1000
46
+ depth_observation: true
47
+ discount_factor: 0.99
48
+ full_observation: false
49
+ normalize: true
50
+ reward: {custom: true, delta_z_scale: 1000.0, grasp_reward: 100.0, shaped: true, terminal_reward: 10000.0,
51
+ time_penalty: 200.0}
52
+ robot: {discrete: false, max_force: 100, max_translation: 0.03, max_yaw_rotation: 0.15,
53
+ model_path: models/gripper/wsg50_one_motor_gripper_new.sdf, num_actions_pad: 2,
54
+ step_size: 0.01, yaw_step: 0.1}
55
+ scene: {data_set: random_urdfs, scene_type: OnTable}
56
+ sensor:
57
+ camera_info: config/camera_info.yaml
58
+ encoder_dir: encoder_files/new_gripper_encoder
59
+ randomize: {focal_length: 4, optical_center: 2, rotation: 0.0349, translation: 0.002}
60
+ transform: config/camera_transform.yaml
61
+ visualize: false
62
+ simplified: false
63
+ simulation: {real_time: false, visualize: false}
64
+ skip_empty_initial_state: true
65
+ time_horizon: 200
SAC_1m_table_clearing/log_file.monitor.csv ADDED
The diff for this file is too large to render. See raw diff
 
SAC_1m_table_clearing/vecnormalize.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2a33d56ecf250e61c8eef396a5e9813d14c721ce6221f278eaba05af768e4e3c
3
+ size 252579