File size: 5,451 Bytes
62e03a2
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
2023-03-31 23:14:42 - r - INFO: - Hyperparameters:
2023-03-31 23:14:42 - r - INFO: - ================================================================================
2023-03-31 23:14:42 - r - INFO: -         Name        	       Value        	        Type        
2023-03-31 23:14:42 - r - INFO: -       env_name      	    CartPole-v1     	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -     new_step_api    	         1          	   <class 'bool'>   
2023-03-31 23:14:42 - r - INFO: -       wrapper       	        None        	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -        render       	         0          	   <class 'bool'>   
2023-03-31 23:14:42 - r - INFO: -      algo_name      	      PER_DQN       	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -         mode        	        test        	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -         seed        	         1          	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -        device       	        cuda        	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -      train_eps      	        100         	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -       test_eps      	         10         	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -       eval_eps      	         10         	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -   eval_per_episode  	         5          	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -      max_steps      	        200         	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -   load_checkpoint   	         1          	   <class 'bool'>   
2023-03-31 23:14:42 - r - INFO: -      load_path      	Train_CartPole-v1_PER_DQN_20230331-225815	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -       show_fig      	         0          	   <class 'bool'>   
2023-03-31 23:14:42 - r - INFO: -       save_fig      	         1          	   <class 'bool'>   
2023-03-31 23:14:42 - r - INFO: -    epsilon_start    	        0.95        	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -     epsilon_end     	        0.01        	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -    epsilon_decay    	        500         	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -      hidden_dim     	        256         	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -        gamma        	        0.99        	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -          lr         	       0.0001       	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -     buffer_size     	       100000       	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -      per_alpha      	        0.6         	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -       per_beta      	        0.4         	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -  per_beta_annealing 	       0.001        	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -     per_epsilon     	        0.01        	  <class 'float'>   
2023-03-31 23:14:42 - r - INFO: -      batch_size     	         64         	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -    target_update    	         4          	   <class 'int'>    
2023-03-31 23:14:42 - r - INFO: -     value_layers    	[{'layer_type': 'linear', 'layer_dim': ['n_states', 256], 'activation': 'relu'}, {'layer_type': 'linear', 'layer_dim': [256, 256], 'activation': 'relu'}, {'layer_type': 'linear', 'layer_dim': [256, 'n_actions'], 'activation': 'none'}]	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -       task_dir      	C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_PER_DQN_20230331-231442	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -       res_dir       	C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_PER_DQN_20230331-231442/results	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -       log_dir       	C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_PER_DQN_20230331-231442/logs	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -       traj_dir      	C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_PER_DQN_20230331-231442/traj	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: -        tb_dir       	C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_PER_DQN_20230331-231442/tb_logs	   <class 'str'>    
2023-03-31 23:14:42 - r - INFO: - ================================================================================
2023-03-31 23:14:42 - r - INFO: - n_states: 4, n_actions: 2
2023-03-31 23:14:43 - r - INFO: - Start testing!
2023-03-31 23:14:43 - r - INFO: - Env: CartPole-v1, Algorithm: PER_DQN, Device: cuda
2023-03-31 23:14:44 - r - INFO: - Episode: 1/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 2/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 3/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 4/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 5/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 6/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 7/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 8/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 9/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Episode: 10/10, Reward: 200.000, Step: 200
2023-03-31 23:14:44 - r - INFO: - Finish testing!