File size: 6,246 Bytes
62e03a2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
2023-04-04 16:19:39 - r - INFO: - Hyperparameters:
2023-04-04 16:19:39 - r - INFO: - ================================================================================
2023-04-04 16:19:39 - r - INFO: -         Name        	       Value        	        Type        
2023-04-04 16:19:39 - r - INFO: -       env_name      	LunarLanderContinuous-v2	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -      continuous     	         1          	   <class 'bool'>   
2023-04-04 16:19:39 - r - INFO: -     new_step_api    	         1          	   <class 'bool'>   
2023-04-04 16:19:39 - r - INFO: -       wrapper       	        None        	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -        render       	         1          	   <class 'bool'>   
2023-04-04 16:19:39 - r - INFO: -      algo_name      	        SAC         	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -         mode        	        test        	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -     render_mode     	       human        	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -      mp_backend     	         mp         	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -         seed        	        666         	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -        device       	        cpu         	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -      train_eps      	        2000        	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -       test_eps      	         20         	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -       eval_eps      	         10         	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -   eval_per_episode  	         5          	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -      max_steps      	        500         	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -   load_checkpoint   	         1          	   <class 'bool'>   
2023-04-04 16:19:39 - r - INFO: -      load_path      	Train_LunarLanderContinuous-v2_SAC_20230402-170158	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -       show_fig      	         0          	   <class 'bool'>   
2023-04-04 16:19:39 - r - INFO: -       save_fig      	         1          	   <class 'bool'>   
2023-04-04 16:19:39 - r - INFO: -     policy_type     	      Gaussian      	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -          lr         	       0.001        	  <class 'float'>   
2023-04-04 16:19:39 - r - INFO: -        gamma        	        0.99        	  <class 'float'>   
2023-04-04 16:19:39 - r - INFO: -         tau         	       0.005        	  <class 'float'>   
2023-04-04 16:19:39 - r - INFO: -        alpha        	        0.2         	  <class 'float'>   
2023-04-04 16:19:39 - r - INFO: - automatic_entropy_tuning	         0          	   <class 'bool'>   
2023-04-04 16:19:39 - r - INFO: -      batch_size     	         64         	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -      hidden_dim     	        256         	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -       n_epochs      	         1          	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -     start_steps     	       10000        	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -  target_update_fre  	         1          	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -     buffer_size     	      1000000       	   <class 'int'>    
2023-04-04 16:19:39 - r - INFO: -       task_dir      	G:\Python3\RL\Pytorch\joyrl-offline-main/tasks/Test_LunarLanderContinuous-v2_SAC_20230404-161934	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -       res_dir       	G:\Python3\RL\Pytorch\joyrl-offline-main/tasks/Test_LunarLanderContinuous-v2_SAC_20230404-161934/results	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -       log_dir       	G:\Python3\RL\Pytorch\joyrl-offline-main/tasks/Test_LunarLanderContinuous-v2_SAC_20230404-161934/logs	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -       traj_dir      	G:\Python3\RL\Pytorch\joyrl-offline-main/tasks/Test_LunarLanderContinuous-v2_SAC_20230404-161934/traj	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: -        tb_dir       	G:\Python3\RL\Pytorch\joyrl-offline-main/tasks/Test_LunarLanderContinuous-v2_SAC_20230404-161934/tb_logs	   <class 'str'>    
2023-04-04 16:19:39 - r - INFO: - ================================================================================
2023-04-04 16:19:39 - r - INFO: - action_bound: 1.0
2023-04-04 16:19:39 - r - INFO: - n_states: 8, n_actions: 2
2023-04-04 16:19:39 - r - INFO: - Start testing!
2023-04-04 16:19:39 - r - INFO: - Env: LunarLanderContinuous-v2, Algorithm: SAC, Device: cpu
2023-04-04 16:19:45 - r - INFO: - Episode: 1/20, Reward: 247.478, Step: 230
2023-04-04 16:19:49 - r - INFO: - Episode: 2/20, Reward: 260.547, Step: 195
2023-04-04 16:19:53 - r - INFO: - Episode: 3/20, Reward: 259.074, Step: 178
2023-04-04 16:19:57 - r - INFO: - Episode: 4/20, Reward: 296.493, Step: 192
2023-04-04 16:20:01 - r - INFO: - Episode: 5/20, Reward: 292.460, Step: 225
2023-04-04 16:20:07 - r - INFO: - Episode: 6/20, Reward: 282.687, Step: 294
2023-04-04 16:20:12 - r - INFO: - Episode: 7/20, Reward: 239.822, Step: 242
2023-04-04 16:20:16 - r - INFO: - Episode: 8/20, Reward: 270.872, Step: 196
2023-04-04 16:20:21 - r - INFO: - Episode: 9/20, Reward: 276.446, Step: 213
2023-04-04 16:20:24 - r - INFO: - Episode: 10/20, Reward: 284.918, Step: 186
2023-04-04 16:20:31 - r - INFO: - Episode: 11/20, Reward: 278.167, Step: 305
2023-04-04 16:20:34 - r - INFO: - Episode: 12/20, Reward: 294.946, Step: 180
2023-04-04 16:20:39 - r - INFO: - Episode: 13/20, Reward: 277.009, Step: 211
2023-04-04 16:20:43 - r - INFO: - Episode: 14/20, Reward: 275.229, Step: 199
2023-04-04 16:20:48 - r - INFO: - Episode: 15/20, Reward: 283.965, Step: 237
2023-04-04 16:20:52 - r - INFO: - Episode: 16/20, Reward: 268.659, Step: 226
2023-04-04 16:20:57 - r - INFO: - Episode: 17/20, Reward: 277.079, Step: 235
2023-04-04 16:21:02 - r - INFO: - Episode: 18/20, Reward: 263.336, Step: 245
2023-04-04 16:21:07 - r - INFO: - Episode: 19/20, Reward: 238.160, Step: 221
2023-04-04 16:21:12 - r - INFO: - Episode: 20/20, Reward: 293.206, Step: 257
2023-04-04 16:21:12 - r - INFO: - Finish testing!