diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/config.yaml b/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/config.yaml deleted file mode 100644 index b823e8bf27e5b4ebc61371d02b6ba01bb999c46e..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/config.yaml +++ /dev/null @@ -1,29 +0,0 @@ -general_cfg: - algo_name: NoisyDQN - device: cpu - env_name: CartPole-v1 - eval_eps: 10 - eval_per_episode: 5 - load_checkpoint: true - load_path: Train_CartPole-v1_NoisyDQN_20230318-162139 - max_steps: 200 - mode: test - new_step_api: true - render: false - save_fig: true - seed: 1 - show_fig: false - test_eps: 10 - train_eps: 100 - wrapper: null -algo_cfg: - batch_size: 64 - buffer_size: 100000 - epsilon_decay: 500 - epsilon_end: 0.01 - epsilon_start: 0.95 - gamma: 0.95 - hidden_dim: 256 - lr: 0.0001 - target_update: 4 - tau: 1.0 diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/logs/log.txt b/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/logs/log.txt deleted file mode 100644 index 2421d393873f81b8759b75b457b3599d6e9901f8..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/logs/log.txt +++ /dev/null @@ -1,50 +0,0 @@ -2023-03-18 16:26:30 - r - INFO: - Hyperparameters: -2023-03-18 16:26:30 - r - INFO: - ================================================================================ -2023-03-18 16:26:30 - r - INFO: - Name Value Type -2023-03-18 16:26:30 - r - INFO: - env_name CartPole-v1 -2023-03-18 16:26:30 - r - INFO: - new_step_api 1 -2023-03-18 16:26:30 - r - INFO: - wrapper None -2023-03-18 16:26:30 - r - INFO: - render 0 -2023-03-18 16:26:30 - r - INFO: - algo_name NoisyDQN -2023-03-18 16:26:30 - r - INFO: - mode test -2023-03-18 16:26:30 - r - INFO: - seed 1 -2023-03-18 16:26:30 - r - INFO: - device cpu -2023-03-18 16:26:30 - r - INFO: - train_eps 100 -2023-03-18 16:26:30 - r - INFO: - test_eps 10 -2023-03-18 16:26:30 - r - INFO: - eval_eps 10 -2023-03-18 16:26:30 - r - INFO: - eval_per_episode 5 -2023-03-18 16:26:30 - r - INFO: - max_steps 200 -2023-03-18 16:26:30 - r - INFO: - load_checkpoint 1 -2023-03-18 16:26:30 - r - INFO: - load_path Train_CartPole-v1_NoisyDQN_20230318-162139 -2023-03-18 16:26:30 - r - INFO: - show_fig 0 -2023-03-18 16:26:30 - r - INFO: - save_fig 1 -2023-03-18 16:26:30 - r - INFO: - epsilon_start 0.95 -2023-03-18 16:26:30 - r - INFO: - tau 1.0 -2023-03-18 16:26:30 - r - INFO: - epsilon_end 0.01 -2023-03-18 16:26:30 - r - INFO: - epsilon_decay 500 -2023-03-18 16:26:30 - r - INFO: - hidden_dim 256 -2023-03-18 16:26:30 - r - INFO: - gamma 0.95 -2023-03-18 16:26:30 - r - INFO: - lr 0.0001 -2023-03-18 16:26:30 - r - INFO: - buffer_size 100000 -2023-03-18 16:26:30 - r - INFO: - batch_size 64 -2023-03-18 16:26:30 - r - INFO: - target_update 4 -2023-03-18 16:26:30 - r - INFO: - task_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_NoisyDQN_20230318-162630 -2023-03-18 16:26:30 - r - INFO: - res_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_NoisyDQN_20230318-162630/results -2023-03-18 16:26:30 - r - INFO: - log_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_NoisyDQN_20230318-162630/logs -2023-03-18 16:26:30 - r - INFO: - traj_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_NoisyDQN_20230318-162630/traj -2023-03-18 16:26:30 - r - INFO: - tb_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Test_CartPole-v1_NoisyDQN_20230318-162630/tb_logs -2023-03-18 16:26:30 - r - INFO: - ================================================================================ -2023-03-18 16:26:30 - r - INFO: - n_states: 4, n_actions: 2 -2023-03-18 16:26:30 - r - INFO: - Start testing! -2023-03-18 16:26:30 - r - INFO: - Env: CartPole-v1, Algorithm: NoisyDQN, Device: cpu -2023-03-18 16:26:30 - r - INFO: - Episode: 1/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 2/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 3/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 4/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 5/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 6/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 7/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 8/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 9/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Episode: 10/10, Reward: 200.000, Step: 200 -2023-03-18 16:26:30 - r - INFO: - Finish testing! diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/models/checkpoint.pt b/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/models/checkpoint.pt deleted file mode 100644 index 3aa536480797ae052c46c05f6e9c38201887cdad..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/models/checkpoint.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c018ce117a1834aec6f585e6be780865631d49a8a81fb42ee4db9602b49793f5 -size 804667 diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/results/learning_curve.png b/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/results/learning_curve.png deleted file mode 100644 index 210820b85c519eeeedf89c35f3ca7f5cd798f3ff..0000000000000000000000000000000000000000 Binary files a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/results/learning_curve.png and /dev/null differ diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/tb_logs/events.out.tfevents.1679127990.DESKTOP-H34HQIQ.41784.0 b/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/tb_logs/events.out.tfevents.1679127990.DESKTOP-H34HQIQ.41784.0 deleted file mode 100644 index 47d238227c8026a005c1b4612304ebf1186af257..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/tb_logs/events.out.tfevents.1679127990.DESKTOP-H34HQIQ.41784.0 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:eab9ab499eeb1c82fc01c7c5112993d777beb0303452a699ecf6b3327d1d5857 -size 40 diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/config.yaml b/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/config.yaml deleted file mode 100644 index 804a5013b9280434a87a84bb56d702334e602c9a..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/config.yaml +++ /dev/null @@ -1,36 +0,0 @@ -general_cfg: - algo_name: NoisyDQN - device: cpu - env_name: gym - eval_eps: 10 - eval_per_episode: 5 - load_checkpoint: true - load_path: Train_CartPole-v1_NoisyDQN_mp_20230413-220639 - max_steps: 200 - mode: test - mp_backend: mp - n_workers: 1 - new_step_api: true - render: false - render_mode: human - save_fig: true - seed: 1 - show_fig: false - test_eps: 10 - train_eps: 200 - wrapper: null -algo_cfg: - batch_size: 64 - buffer_size: 100000 - epsilon_decay: 500 - epsilon_end: 0.01 - epsilon_start: 0.95 - gamma: 0.95 - hidden_dim: 256 - lr: 0.0001 - target_update: 4 - tau: 1.0 -env_cfg: - id: CartPole-v1 - new_step_api: true - render_mode: null diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/logs/log.txt b/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/logs/log.txt deleted file mode 100644 index 555e43072353e164e41ca8f8d12cf4a697c26cb6..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/logs/log.txt +++ /dev/null @@ -1,54 +0,0 @@ -2023-04-13 22:10:12 - r - INFO: - Hyperparameters: -2023-04-13 22:10:12 - r - INFO: - ================================================================================ -2023-04-13 22:10:12 - r - INFO: - Name Value Type -2023-04-13 22:10:12 - r - INFO: - env_name gym -2023-04-13 22:10:12 - r - INFO: - new_step_api 1 -2023-04-13 22:10:12 - r - INFO: - wrapper None -2023-04-13 22:10:12 - r - INFO: - render 0 -2023-04-13 22:10:12 - r - INFO: - render_mode None -2023-04-13 22:10:12 - r - INFO: - algo_name NoisyDQN -2023-04-13 22:10:12 - r - INFO: - mode test -2023-04-13 22:10:12 - r - INFO: - mp_backend mp -2023-04-13 22:10:12 - r - INFO: - seed 1 -2023-04-13 22:10:12 - r - INFO: - device cpu -2023-04-13 22:10:12 - r - INFO: - train_eps 200 -2023-04-13 22:10:12 - r - INFO: - test_eps 10 -2023-04-13 22:10:12 - r - INFO: - eval_eps 10 -2023-04-13 22:10:12 - r - INFO: - eval_per_episode 5 -2023-04-13 22:10:12 - r - INFO: - max_steps 200 -2023-04-13 22:10:12 - r - INFO: - load_checkpoint 1 -2023-04-13 22:10:12 - r - INFO: - load_path Train_CartPole-v1_NoisyDQN_mp_20230413-220639 -2023-04-13 22:10:12 - r - INFO: - show_fig 0 -2023-04-13 22:10:12 - r - INFO: - save_fig 1 -2023-04-13 22:10:12 - r - INFO: - n_workers 1 -2023-04-13 22:10:12 - r - INFO: - epsilon_start 0.95 -2023-04-13 22:10:12 - r - INFO: - tau 1.0 -2023-04-13 22:10:12 - r - INFO: - epsilon_end 0.01 -2023-04-13 22:10:12 - r - INFO: - epsilon_decay 500 -2023-04-13 22:10:12 - r - INFO: - hidden_dim 256 -2023-04-13 22:10:12 - r - INFO: - gamma 0.95 -2023-04-13 22:10:12 - r - INFO: - lr 0.0001 -2023-04-13 22:10:12 - r - INFO: - buffer_size 100000 -2023-04-13 22:10:12 - r - INFO: - batch_size 64 -2023-04-13 22:10:12 - r - INFO: - target_update 4 -2023-04-13 22:10:12 - r - INFO: - id CartPole-v1 -2023-04-13 22:10:12 - r - INFO: - task_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230413-221012 -2023-04-13 22:10:12 - r - INFO: - res_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230413-221012/results -2023-04-13 22:10:12 - r - INFO: - log_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230413-221012/logs -2023-04-13 22:10:12 - r - INFO: - traj_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230413-221012/traj -2023-04-13 22:10:12 - r - INFO: - video_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230413-221012/videos -2023-04-13 22:10:12 - r - INFO: - ================================================================================ -2023-04-13 22:10:12 - r - INFO: - n_states: 4, n_actions: 2 -2023-04-13 22:10:12 - r - INFO: - Start testing! -2023-04-13 22:10:12 - r - INFO: - Env: gym, Algorithm: NoisyDQN, Device: cpu -2023-04-13 22:10:12 - r - INFO: - Episode: 1/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 2/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 3/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 4/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 5/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 6/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 7/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 8/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 9/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Episode: 10/10, Reward: 200.000, Step: 200 -2023-04-13 22:10:12 - r - INFO: - Finish testing! diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/models/checkpoint.pt b/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/models/checkpoint.pt deleted file mode 100644 index ee646c7afec5e202c73770cd5fc016b932f986e6..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/models/checkpoint.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ab846435c3ac88c2507622e5f1050d4be6bfc94e33845dc5d7de2fac6df2c92f -size 804667 diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/results/learning_curve.png b/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/results/learning_curve.png deleted file mode 100644 index 0f2e6d031302ee37d97fa4072c63d9da2afba89c..0000000000000000000000000000000000000000 Binary files a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/results/learning_curve.png and /dev/null differ diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/config.yaml b/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/config.yaml deleted file mode 100644 index 236f3f63962bceb5e2848d94130132aae8f58263..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/config.yaml +++ /dev/null @@ -1,36 +0,0 @@ -general_cfg: - algo_name: NoisyDQN - device: cpu - env_name: gym - eval_eps: 10 - eval_per_episode: 5 - load_checkpoint: true - load_path: Train_gym_NoisyDQN_20230414-101351 - max_steps: 200 - mode: test - mp_backend: ray - n_workers: 1 - new_step_api: true - render: false - render_mode: human - save_fig: true - seed: 1 - show_fig: false - test_eps: 10 - train_eps: 200 - wrapper: null -algo_cfg: - batch_size: 64 - buffer_size: 100000 - epsilon_decay: 500 - epsilon_end: 0.01 - epsilon_start: 0.95 - gamma: 0.95 - hidden_dim: 256 - lr: 0.0001 - target_update: 4 - tau: 1.0 -env_cfg: - id: CartPole-v1 - new_step_api: true - render_mode: null diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/logs/log.txt b/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/logs/log.txt deleted file mode 100644 index 6d7b2d60ecb42fdac6fcc6cf6c99954ef6f26e6e..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/logs/log.txt +++ /dev/null @@ -1,54 +0,0 @@ -2023-04-14 10:19:26 - r - INFO: - Hyperparameters: -2023-04-14 10:19:26 - r - INFO: - ================================================================================ -2023-04-14 10:19:26 - r - INFO: - Name Value Type -2023-04-14 10:19:26 - r - INFO: - env_name gym -2023-04-14 10:19:26 - r - INFO: - new_step_api 1 -2023-04-14 10:19:26 - r - INFO: - wrapper None -2023-04-14 10:19:26 - r - INFO: - render 0 -2023-04-14 10:19:26 - r - INFO: - render_mode None -2023-04-14 10:19:26 - r - INFO: - algo_name NoisyDQN -2023-04-14 10:19:26 - r - INFO: - mode test -2023-04-14 10:19:26 - r - INFO: - mp_backend ray -2023-04-14 10:19:26 - r - INFO: - seed 1 -2023-04-14 10:19:26 - r - INFO: - device cpu -2023-04-14 10:19:26 - r - INFO: - train_eps 200 -2023-04-14 10:19:26 - r - INFO: - test_eps 10 -2023-04-14 10:19:26 - r - INFO: - eval_eps 10 -2023-04-14 10:19:26 - r - INFO: - eval_per_episode 5 -2023-04-14 10:19:26 - r - INFO: - max_steps 200 -2023-04-14 10:19:26 - r - INFO: - load_checkpoint 1 -2023-04-14 10:19:26 - r - INFO: - load_path Train_gym_NoisyDQN_20230414-101351 -2023-04-14 10:19:26 - r - INFO: - show_fig 0 -2023-04-14 10:19:26 - r - INFO: - save_fig 1 -2023-04-14 10:19:26 - r - INFO: - n_workers 1 -2023-04-14 10:19:26 - r - INFO: - epsilon_start 0.95 -2023-04-14 10:19:26 - r - INFO: - tau 1.0 -2023-04-14 10:19:26 - r - INFO: - epsilon_end 0.01 -2023-04-14 10:19:26 - r - INFO: - epsilon_decay 500 -2023-04-14 10:19:26 - r - INFO: - hidden_dim 256 -2023-04-14 10:19:26 - r - INFO: - gamma 0.95 -2023-04-14 10:19:26 - r - INFO: - lr 0.0001 -2023-04-14 10:19:26 - r - INFO: - buffer_size 100000 -2023-04-14 10:19:26 - r - INFO: - batch_size 64 -2023-04-14 10:19:26 - r - INFO: - target_update 4 -2023-04-14 10:19:26 - r - INFO: - id CartPole-v1 -2023-04-14 10:19:26 - r - INFO: - task_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230414-101926 -2023-04-14 10:19:26 - r - INFO: - res_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230414-101926/results -2023-04-14 10:19:26 - r - INFO: - log_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230414-101926/logs -2023-04-14 10:19:26 - r - INFO: - traj_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230414-101926/traj -2023-04-14 10:19:26 - r - INFO: - video_dir /media/disk/gsc/joyrl-offline/tasks/Test_gym_NoisyDQN_20230414-101926/videos -2023-04-14 10:19:26 - r - INFO: - ================================================================================ -2023-04-14 10:19:26 - r - INFO: - n_states: 4, n_actions: 2 -2023-04-14 10:19:26 - r - INFO: - Start testing! -2023-04-14 10:19:26 - r - INFO: - Env: gym, Algorithm: NoisyDQN, Device: cpu -2023-04-14 10:19:26 - r - INFO: - Episode: 1/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:26 - r - INFO: - Episode: 2/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:26 - r - INFO: - Episode: 3/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:26 - r - INFO: - Episode: 4/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:26 - r - INFO: - Episode: 5/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:26 - r - INFO: - Episode: 6/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:26 - r - INFO: - Episode: 7/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:26 - r - INFO: - Episode: 8/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:27 - r - INFO: - Episode: 9/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:27 - r - INFO: - Episode: 10/10, Reward: 200.000, Step: 200 -2023-04-14 10:19:27 - r - INFO: - Finish testing! diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/models/checkpoint.pt b/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/models/checkpoint.pt deleted file mode 100644 index 5c648ab8e0e4d608b462bcff135f583c4594ea2f..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/models/checkpoint.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:96c4f99970f7ebbc667d28e3f1c8c05399296b0257a95025ab12b4eca17d3919 -size 804667 diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/results/learning_curve.png b/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/results/learning_curve.png deleted file mode 100644 index 0f2e6d031302ee37d97fa4072c63d9da2afba89c..0000000000000000000000000000000000000000 Binary files a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/results/learning_curve.png and /dev/null differ diff --git a/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/res.csv b/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/res.csv deleted file mode 100644 index cbbcf2eb2cccfce2f3060e96b3484890fe578ac1..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/res.csv +++ /dev/null @@ -1,11 +0,0 @@ -episodes,rewards,steps -0,200.0,200 -1,200.0,200 -2,200.0,200 -3,200.0,200 -4,200.0,200 -5,200.0,200 -6,200.0,200 -7,200.0,200 -8,200.0,200 -9,200.0,200 diff --git a/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/res.csv b/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/res.csv deleted file mode 100644 index cbbcf2eb2cccfce2f3060e96b3484890fe578ac1..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/res.csv +++ /dev/null @@ -1,11 +0,0 @@ -episodes,rewards,steps -0,200.0,200 -1,200.0,200 -2,200.0,200 -3,200.0,200 -4,200.0,200 -5,200.0,200 -6,200.0,200 -7,200.0,200 -8,200.0,200 -9,200.0,200 diff --git a/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/res.csv b/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/res.csv deleted file mode 100644 index cbbcf2eb2cccfce2f3060e96b3484890fe578ac1..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/res.csv +++ /dev/null @@ -1,11 +0,0 @@ -episodes,rewards,steps -0,200.0,200 -1,200.0,200 -2,200.0,200 -3,200.0,200 -4,200.0,200 -5,200.0,200 -6,200.0,200 -7,200.0,200 -8,200.0,200 -9,200.0,200 diff --git a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/config.yaml b/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/config.yaml deleted file mode 100644 index 1e7a4cc61a537d3d4acb61a0b165811120d673fc..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/config.yaml +++ /dev/null @@ -1,44 +0,0 @@ -general_cfg: - algo_name: DQN - device: cpu - env_name: CartPole-v1 - eval_eps: 10 - eval_per_episode: 5 - load_checkpoint: true - load_path: Train_CartPole-v1_mp_DQN_20230319-215340 - max_steps: 200 - mode: test - n_workers: 1 - new_step_api: true - render: false - save_fig: true - seed: 1 - show_fig: false - test_eps: 20 - train_eps: 300 - wrapper: null -algo_cfg: - batch_size: 64 - buffer_size: 100000 - epsilon_decay: 500 - epsilon_end: 0.01 - epsilon_start: 0.95 - gamma: 0.95 - lr: 0.0001 - target_update: 4 - value_layers: - - activation: relu - layer_dim: - - n_states - - 256 - layer_type: linear - - activation: relu - layer_dim: - - 256 - - 256 - layer_type: linear - - activation: none - layer_dim: - - 256 - - n_actions - layer_type: linear diff --git a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/logs/log.txt b/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/logs/log.txt deleted file mode 100644 index 01d405051cfaa47b789f7f82ef4390cc5327b883..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/logs/log.txt +++ /dev/null @@ -1,60 +0,0 @@ -2023-03-19 21:58:06 - r - INFO: - Hyperparameters: -2023-03-19 21:58:06 - r - INFO: - ================================================================================ -2023-03-19 21:58:06 - r - INFO: - Name Value Type -2023-03-19 21:58:06 - r - INFO: - env_name CartPole-v1 -2023-03-19 21:58:06 - r - INFO: - new_step_api 1 -2023-03-19 21:58:06 - r - INFO: - wrapper None -2023-03-19 21:58:06 - r - INFO: - render 0 -2023-03-19 21:58:06 - r - INFO: - algo_name DQN -2023-03-19 21:58:06 - r - INFO: - mode test -2023-03-19 21:58:06 - r - INFO: - seed 1 -2023-03-19 21:58:06 - r - INFO: - device cpu -2023-03-19 21:58:06 - r - INFO: - train_eps 300 -2023-03-19 21:58:06 - r - INFO: - test_eps 20 -2023-03-19 21:58:06 - r - INFO: - eval_eps 10 -2023-03-19 21:58:06 - r - INFO: - eval_per_episode 5 -2023-03-19 21:58:06 - r - INFO: - max_steps 200 -2023-03-19 21:58:06 - r - INFO: - load_checkpoint 1 -2023-03-19 21:58:06 - r - INFO: - load_path Train_CartPole-v1_mp_DQN_20230319-215340 -2023-03-19 21:58:06 - r - INFO: - show_fig 0 -2023-03-19 21:58:06 - r - INFO: - save_fig 1 -2023-03-19 21:58:06 - r - INFO: - n_workers 1 -2023-03-19 21:58:06 - r - INFO: - epsilon_start 0.95 -2023-03-19 21:58:06 - r - INFO: - epsilon_end 0.01 -2023-03-19 21:58:06 - r - INFO: - epsilon_decay 500 -2023-03-19 21:58:06 - r - INFO: - gamma 0.95 -2023-03-19 21:58:06 - r - INFO: - lr 0.0001 -2023-03-19 21:58:06 - r - INFO: - buffer_size 100000 -2023-03-19 21:58:06 - r - INFO: - batch_size 64 -2023-03-19 21:58:06 - r - INFO: - target_update 4 -2023-03-19 21:58:06 - r - INFO: - value_layers [{'layer_type': 'linear', 'layer_dim': ['n_states', 256], 'activation': 'relu'}, {'layer_type': 'linear', 'layer_dim': [256, 256], 'activation': 'relu'}, {'layer_type': 'linear', 'layer_dim': [256, 'n_actions'], 'activation': 'none'}] -2023-03-19 21:58:06 - r - INFO: - task_dir /media/disk/gsc/joyrl-offline/tasks/Test_CartPole-v1_DQN_20230319-215806 -2023-03-19 21:58:06 - r - INFO: - res_dir /media/disk/gsc/joyrl-offline/tasks/Test_CartPole-v1_DQN_20230319-215806/results -2023-03-19 21:58:06 - r - INFO: - log_dir /media/disk/gsc/joyrl-offline/tasks/Test_CartPole-v1_DQN_20230319-215806/logs -2023-03-19 21:58:06 - r - INFO: - traj_dir /media/disk/gsc/joyrl-offline/tasks/Test_CartPole-v1_DQN_20230319-215806/traj -2023-03-19 21:58:06 - r - INFO: - tb_dir /media/disk/gsc/joyrl-offline/tasks/Test_CartPole-v1_DQN_20230319-215806/tb_logs -2023-03-19 21:58:06 - r - INFO: - ================================================================================ -2023-03-19 21:58:06 - r - INFO: - n_states: 4, n_actions: 2 -2023-03-19 21:58:06 - r - INFO: - Start testing! -2023-03-19 21:58:06 - r - INFO: - Env: CartPole-v1, Algorithm: DQN, Device: cpu -2023-03-19 21:58:07 - r - INFO: - Episode: 1/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 2/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 3/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 4/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 5/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 6/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 7/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 8/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 9/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 10/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 11/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 12/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 13/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 14/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 15/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 16/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 17/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 18/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 19/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Episode: 20/20, Reward: 200.000, Step: 200 -2023-03-19 21:58:07 - r - INFO: - Finish testing! diff --git a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/models/checkpoint.pt b/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/models/checkpoint.pt deleted file mode 100644 index e20bc5cbeafb154ae2c3816a36507e9e8c5b34ae..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/models/checkpoint.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:308eccb972f5142d25c00579d63ecd9ae50df94fcdd9bb172d00217e9db3dd12 -size 272407 diff --git a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/results/learning_curve.png b/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/results/learning_curve.png deleted file mode 100644 index 5084beef5e93d281c8ae9ad28e4f0f7934e7b925..0000000000000000000000000000000000000000 Binary files a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/results/learning_curve.png and /dev/null differ diff --git a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/results/res.csv b/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/results/res.csv deleted file mode 100644 index bbcf538967643440c57b300a16b93f8465e2ab9f..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/results/res.csv +++ /dev/null @@ -1,21 +0,0 @@ -episodes,rewards,steps -0,200.0,200 -1,200.0,200 -2,200.0,200 -3,200.0,200 -4,200.0,200 -5,200.0,200 -6,200.0,200 -7,200.0,200 -8,200.0,200 -9,200.0,200 -10,200.0,200 -11,200.0,200 -12,200.0,200 -13,200.0,200 -14,200.0,200 -15,200.0,200 -16,200.0,200 -17,200.0,200 -18,200.0,200 -19,200.0,200 diff --git a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/tb_logs/events.out.tfevents.1679234286.ML3090.3788443.0 b/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/tb_logs/events.out.tfevents.1679234286.ML3090.3788443.0 deleted file mode 100644 index aeb11a4cee5596929ed39f058b33a74f0791349c..0000000000000000000000000000000000000000 --- a/CartPole-v1/Test_CartPole-v1_mp_DQN_20230319-215806/tb_logs/events.out.tfevents.1679234286.ML3090.3788443.0 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:86913021f0ed612b76dea0115a72ea9ca414e36e4a9b8ba768ae086473f616d8 -size 40 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/config.yaml b/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/config.yaml deleted file mode 100644 index 16cfc077edc93491b75e80245132c3c924df26e1..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/config.yaml +++ /dev/null @@ -1,29 +0,0 @@ -general_cfg: - algo_name: NoisyDQN - device: cpu - env_name: CartPole-v1 - eval_eps: 10 - eval_per_episode: 5 - load_checkpoint: false - load_path: Train_CartPole-v1_NoisyDQN - max_steps: 200 - mode: train - new_step_api: true - render: false - save_fig: true - seed: 1 - show_fig: false - test_eps: 10 - train_eps: 100 - wrapper: null -algo_cfg: - batch_size: 64 - buffer_size: 100000 - epsilon_decay: 500 - epsilon_end: 0.01 - epsilon_start: 0.95 - gamma: 0.95 - hidden_dim: 256 - lr: 0.0001 - target_update: 4 - tau: 1.0 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/logs/log.txt b/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/logs/log.txt deleted file mode 100644 index 8863b77f4b7bc26281e0cd1cbc340f537a31c11b..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/logs/log.txt +++ /dev/null @@ -1,153 +0,0 @@ -2023-03-18 16:21:39 - r - INFO: - Hyperparameters: -2023-03-18 16:21:39 - r - INFO: - ================================================================================ -2023-03-18 16:21:39 - r - INFO: - Name Value Type -2023-03-18 16:21:39 - r - INFO: - env_name CartPole-v1 -2023-03-18 16:21:39 - r - INFO: - new_step_api 1 -2023-03-18 16:21:39 - r - INFO: - wrapper None -2023-03-18 16:21:39 - r - INFO: - render 0 -2023-03-18 16:21:39 - r - INFO: - algo_name NoisyDQN -2023-03-18 16:21:39 - r - INFO: - mode train -2023-03-18 16:21:39 - r - INFO: - seed 1 -2023-03-18 16:21:39 - r - INFO: - device cpu -2023-03-18 16:21:39 - r - INFO: - train_eps 100 -2023-03-18 16:21:39 - r - INFO: - test_eps 10 -2023-03-18 16:21:39 - r - INFO: - eval_eps 10 -2023-03-18 16:21:39 - r - INFO: - eval_per_episode 5 -2023-03-18 16:21:39 - r - INFO: - max_steps 200 -2023-03-18 16:21:39 - r - INFO: - load_checkpoint 0 -2023-03-18 16:21:39 - r - INFO: - load_path Train_CartPole-v1_NoisyDQN -2023-03-18 16:21:39 - r - INFO: - show_fig 0 -2023-03-18 16:21:39 - r - INFO: - save_fig 1 -2023-03-18 16:21:39 - r - INFO: - epsilon_start 0.95 -2023-03-18 16:21:39 - r - INFO: - tau 1.0 -2023-03-18 16:21:39 - r - INFO: - epsilon_end 0.01 -2023-03-18 16:21:39 - r - INFO: - epsilon_decay 500 -2023-03-18 16:21:39 - r - INFO: - hidden_dim 256 -2023-03-18 16:21:39 - r - INFO: - gamma 0.95 -2023-03-18 16:21:39 - r - INFO: - lr 0.0001 -2023-03-18 16:21:39 - r - INFO: - buffer_size 100000 -2023-03-18 16:21:39 - r - INFO: - batch_size 64 -2023-03-18 16:21:39 - r - INFO: - target_update 4 -2023-03-18 16:21:39 - r - INFO: - task_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Train_CartPole-v1_NoisyDQN_20230318-162139 -2023-03-18 16:21:39 - r - INFO: - res_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Train_CartPole-v1_NoisyDQN_20230318-162139/results -2023-03-18 16:21:39 - r - INFO: - log_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Train_CartPole-v1_NoisyDQN_20230318-162139/logs -2023-03-18 16:21:39 - r - INFO: - traj_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Train_CartPole-v1_NoisyDQN_20230318-162139/traj -2023-03-18 16:21:39 - r - INFO: - tb_dir C:\Users\24438\Desktop\joyrl-offline/tasks/Train_CartPole-v1_NoisyDQN_20230318-162139/tb_logs -2023-03-18 16:21:39 - r - INFO: - ================================================================================ -2023-03-18 16:21:39 - r - INFO: - n_states: 4, n_actions: 2 -2023-03-18 16:21:39 - r - INFO: - Start training! -2023-03-18 16:21:39 - r - INFO: - Env: CartPole-v1, Algorithm: NoisyDQN, Device: cpu -2023-03-18 16:21:39 - r - INFO: - Episode: 1/100, Reward: 16.000, Step: 16 -2023-03-18 16:21:39 - r - INFO: - Episode: 2/100, Reward: 16.000, Step: 16 -2023-03-18 16:21:39 - r - INFO: - Episode: 3/100, Reward: 18.000, Step: 18 -2023-03-18 16:21:39 - r - INFO: - Episode: 4/100, Reward: 14.000, Step: 14 -2023-03-18 16:21:39 - r - INFO: - Episode: 5/100, Reward: 22.000, Step: 22 -2023-03-18 16:21:39 - r - INFO: - Current episode 5 has the best eval reward: 9.300 -2023-03-18 16:21:39 - r - INFO: - Episode: 6/100, Reward: 27.000, Step: 27 -2023-03-18 16:21:40 - r - INFO: - Episode: 7/100, Reward: 9.000, Step: 9 -2023-03-18 16:21:40 - r - INFO: - Episode: 8/100, Reward: 13.000, Step: 13 -2023-03-18 16:21:40 - r - INFO: - Episode: 9/100, Reward: 17.000, Step: 17 -2023-03-18 16:21:40 - r - INFO: - Episode: 10/100, Reward: 37.000, Step: 37 -2023-03-18 16:21:40 - r - INFO: - Current episode 10 has the best eval reward: 9.500 -2023-03-18 16:21:40 - r - INFO: - Episode: 11/100, Reward: 15.000, Step: 15 -2023-03-18 16:21:40 - r - INFO: - Episode: 12/100, Reward: 22.000, Step: 22 -2023-03-18 16:21:40 - r - INFO: - Episode: 13/100, Reward: 9.000, Step: 9 -2023-03-18 16:21:40 - r - INFO: - Episode: 14/100, Reward: 14.000, Step: 14 -2023-03-18 16:21:40 - r - INFO: - Episode: 15/100, Reward: 12.000, Step: 12 -2023-03-18 16:21:40 - r - INFO: - Current episode 15 has the best eval reward: 9.700 -2023-03-18 16:21:40 - r - INFO: - Episode: 16/100, Reward: 16.000, Step: 16 -2023-03-18 16:21:40 - r - INFO: - Episode: 17/100, Reward: 16.000, Step: 16 -2023-03-18 16:21:40 - r - INFO: - Episode: 18/100, Reward: 14.000, Step: 14 -2023-03-18 16:21:40 - r - INFO: - Episode: 19/100, Reward: 11.000, Step: 11 -2023-03-18 16:21:40 - r - INFO: - Episode: 20/100, Reward: 13.000, Step: 13 -2023-03-18 16:21:40 - r - INFO: - Current episode 20 has the best eval reward: 9.700 -2023-03-18 16:21:40 - r - INFO: - Episode: 21/100, Reward: 13.000, Step: 13 -2023-03-18 16:21:42 - r - INFO: - Episode: 22/100, Reward: 14.000, Step: 14 -2023-03-18 16:21:42 - r - INFO: - Episode: 23/100, Reward: 14.000, Step: 14 -2023-03-18 16:21:42 - r - INFO: - Episode: 24/100, Reward: 37.000, Step: 37 -2023-03-18 16:21:42 - r - INFO: - Episode: 25/100, Reward: 12.000, Step: 12 -2023-03-18 16:21:42 - r - INFO: - Episode: 26/100, Reward: 18.000, Step: 18 -2023-03-18 16:21:42 - r - INFO: - Episode: 27/100, Reward: 13.000, Step: 13 -2023-03-18 16:21:42 - r - INFO: - Episode: 28/100, Reward: 20.000, Step: 20 -2023-03-18 16:21:43 - r - INFO: - Episode: 29/100, Reward: 17.000, Step: 17 -2023-03-18 16:21:43 - r - INFO: - Episode: 30/100, Reward: 10.000, Step: 10 -2023-03-18 16:21:43 - r - INFO: - Current episode 30 has the best eval reward: 13.700 -2023-03-18 16:21:43 - r - INFO: - Episode: 31/100, Reward: 10.000, Step: 10 -2023-03-18 16:21:43 - r - INFO: - Episode: 32/100, Reward: 12.000, Step: 12 -2023-03-18 16:21:43 - r - INFO: - Episode: 33/100, Reward: 11.000, Step: 11 -2023-03-18 16:21:43 - r - INFO: - Episode: 34/100, Reward: 12.000, Step: 12 -2023-03-18 16:21:43 - r - INFO: - Episode: 35/100, Reward: 17.000, Step: 17 -2023-03-18 16:21:43 - r - INFO: - Current episode 35 has the best eval reward: 32.500 -2023-03-18 16:21:43 - r - INFO: - Episode: 36/100, Reward: 17.000, Step: 17 -2023-03-18 16:21:43 - r - INFO: - Episode: 37/100, Reward: 17.000, Step: 17 -2023-03-18 16:21:43 - r - INFO: - Episode: 38/100, Reward: 23.000, Step: 23 -2023-03-18 16:21:43 - r - INFO: - Episode: 39/100, Reward: 35.000, Step: 35 -2023-03-18 16:21:43 - r - INFO: - Episode: 40/100, Reward: 46.000, Step: 46 -2023-03-18 16:21:44 - r - INFO: - Episode: 41/100, Reward: 10.000, Step: 10 -2023-03-18 16:21:44 - r - INFO: - Episode: 42/100, Reward: 13.000, Step: 13 -2023-03-18 16:21:44 - r - INFO: - Episode: 43/100, Reward: 27.000, Step: 27 -2023-03-18 16:21:44 - r - INFO: - Episode: 44/100, Reward: 43.000, Step: 43 -2023-03-18 16:21:44 - r - INFO: - Episode: 45/100, Reward: 23.000, Step: 23 -2023-03-18 16:21:44 - r - INFO: - Episode: 46/100, Reward: 31.000, Step: 31 -2023-03-18 16:21:44 - r - INFO: - Episode: 47/100, Reward: 36.000, Step: 36 -2023-03-18 16:21:44 - r - INFO: - Episode: 48/100, Reward: 27.000, Step: 27 -2023-03-18 16:21:44 - r - INFO: - Episode: 49/100, Reward: 27.000, Step: 27 -2023-03-18 16:21:44 - r - INFO: - Episode: 50/100, Reward: 40.000, Step: 40 -2023-03-18 16:21:44 - r - INFO: - Current episode 50 has the best eval reward: 36.900 -2023-03-18 16:21:45 - r - INFO: - Episode: 51/100, Reward: 47.000, Step: 47 -2023-03-18 16:21:45 - r - INFO: - Episode: 52/100, Reward: 60.000, Step: 60 -2023-03-18 16:21:45 - r - INFO: - Episode: 53/100, Reward: 104.000, Step: 104 -2023-03-18 16:21:45 - r - INFO: - Episode: 54/100, Reward: 70.000, Step: 70 -2023-03-18 16:21:45 - r - INFO: - Episode: 55/100, Reward: 65.000, Step: 65 -2023-03-18 16:21:46 - r - INFO: - Episode: 56/100, Reward: 96.000, Step: 96 -2023-03-18 16:21:46 - r - INFO: - Episode: 57/100, Reward: 34.000, Step: 34 -2023-03-18 16:21:46 - r - INFO: - Episode: 58/100, Reward: 30.000, Step: 30 -2023-03-18 16:21:46 - r - INFO: - Episode: 59/100, Reward: 63.000, Step: 63 -2023-03-18 16:21:46 - r - INFO: - Episode: 60/100, Reward: 32.000, Step: 32 -2023-03-18 16:21:46 - r - INFO: - Current episode 60 has the best eval reward: 104.900 -2023-03-18 16:21:47 - r - INFO: - Episode: 61/100, Reward: 36.000, Step: 36 -2023-03-18 16:21:47 - r - INFO: - Episode: 62/100, Reward: 26.000, Step: 26 -2023-03-18 16:21:47 - r - INFO: - Episode: 63/100, Reward: 29.000, Step: 29 -2023-03-18 16:21:47 - r - INFO: - Episode: 64/100, Reward: 58.000, Step: 58 -2023-03-18 16:21:47 - r - INFO: - Episode: 65/100, Reward: 123.000, Step: 123 -2023-03-18 16:21:47 - r - INFO: - Episode: 66/100, Reward: 74.000, Step: 74 -2023-03-18 16:21:48 - r - INFO: - Episode: 67/100, Reward: 56.000, Step: 56 -2023-03-18 16:21:48 - r - INFO: - Episode: 68/100, Reward: 76.000, Step: 76 -2023-03-18 16:21:48 - r - INFO: - Episode: 69/100, Reward: 63.000, Step: 63 -2023-03-18 16:21:48 - r - INFO: - Episode: 70/100, Reward: 55.000, Step: 55 -2023-03-18 16:21:48 - r - INFO: - Episode: 71/100, Reward: 76.000, Step: 76 -2023-03-18 16:21:49 - r - INFO: - Episode: 72/100, Reward: 59.000, Step: 59 -2023-03-18 16:21:49 - r - INFO: - Episode: 73/100, Reward: 70.000, Step: 70 -2023-03-18 16:21:49 - r - INFO: - Episode: 74/100, Reward: 98.000, Step: 98 -2023-03-18 16:21:49 - r - INFO: - Episode: 75/100, Reward: 60.000, Step: 60 -2023-03-18 16:21:50 - r - INFO: - Episode: 76/100, Reward: 114.000, Step: 114 -2023-03-18 16:21:50 - r - INFO: - Episode: 77/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:51 - r - INFO: - Episode: 78/100, Reward: 199.000, Step: 199 -2023-03-18 16:21:51 - r - INFO: - Episode: 79/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:52 - r - INFO: - Episode: 80/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:52 - r - INFO: - Current episode 80 has the best eval reward: 200.000 -2023-03-18 16:21:53 - r - INFO: - Episode: 81/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:53 - r - INFO: - Episode: 82/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:54 - r - INFO: - Episode: 83/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:55 - r - INFO: - Episode: 84/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:55 - r - INFO: - Episode: 85/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:56 - r - INFO: - Current episode 85 has the best eval reward: 200.000 -2023-03-18 16:21:56 - r - INFO: - Episode: 86/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:57 - r - INFO: - Episode: 87/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:57 - r - INFO: - Episode: 88/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:58 - r - INFO: - Episode: 89/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:58 - r - INFO: - Episode: 90/100, Reward: 200.000, Step: 200 -2023-03-18 16:21:59 - r - INFO: - Current episode 90 has the best eval reward: 200.000 -2023-03-18 16:21:59 - r - INFO: - Episode: 91/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:00 - r - INFO: - Episode: 92/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:01 - r - INFO: - Episode: 93/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:01 - r - INFO: - Episode: 94/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:02 - r - INFO: - Episode: 95/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:02 - r - INFO: - Current episode 95 has the best eval reward: 200.000 -2023-03-18 16:22:03 - r - INFO: - Episode: 96/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:03 - r - INFO: - Episode: 97/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:04 - r - INFO: - Episode: 98/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:04 - r - INFO: - Episode: 99/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:05 - r - INFO: - Episode: 100/100, Reward: 200.000, Step: 200 -2023-03-18 16:22:05 - r - INFO: - Current episode 100 has the best eval reward: 200.000 -2023-03-18 16:22:05 - r - INFO: - Finish training! diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/models/checkpoint.pt b/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/models/checkpoint.pt deleted file mode 100644 index 3aa536480797ae052c46c05f6e9c38201887cdad..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/models/checkpoint.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:c018ce117a1834aec6f585e6be780865631d49a8a81fb42ee4db9602b49793f5 -size 804667 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/results/learning_curve.png b/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/results/learning_curve.png deleted file mode 100644 index f050a608bfa5d1d52a397b2b8099325e2c9bf96c..0000000000000000000000000000000000000000 Binary files a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/results/learning_curve.png and /dev/null differ diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/results/res.csv b/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/results/res.csv deleted file mode 100644 index 4ffbb62b37c834f897d291eeff3794e3f1380d56..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/results/res.csv +++ /dev/null @@ -1,101 +0,0 @@ -episodes,rewards,steps -0,16.0,16 -1,16.0,16 -2,18.0,18 -3,14.0,14 -4,22.0,22 -5,27.0,27 -6,9.0,9 -7,13.0,13 -8,17.0,17 -9,37.0,37 -10,15.0,15 -11,22.0,22 -12,9.0,9 -13,14.0,14 -14,12.0,12 -15,16.0,16 -16,16.0,16 -17,14.0,14 -18,11.0,11 -19,13.0,13 -20,13.0,13 -21,14.0,14 -22,14.0,14 -23,37.0,37 -24,12.0,12 -25,18.0,18 -26,13.0,13 -27,20.0,20 -28,17.0,17 -29,10.0,10 -30,10.0,10 -31,12.0,12 -32,11.0,11 -33,12.0,12 -34,17.0,17 -35,17.0,17 -36,17.0,17 -37,23.0,23 -38,35.0,35 -39,46.0,46 -40,10.0,10 -41,13.0,13 -42,27.0,27 -43,43.0,43 -44,23.0,23 -45,31.0,31 -46,36.0,36 -47,27.0,27 -48,27.0,27 -49,40.0,40 -50,47.0,47 -51,60.0,60 -52,104.0,104 -53,70.0,70 -54,65.0,65 -55,96.0,96 -56,34.0,34 -57,30.0,30 -58,63.0,63 -59,32.0,32 -60,36.0,36 -61,26.0,26 -62,29.0,29 -63,58.0,58 -64,123.0,123 -65,74.0,74 -66,56.0,56 -67,76.0,76 -68,63.0,63 -69,55.0,55 -70,76.0,76 -71,59.0,59 -72,70.0,70 -73,98.0,98 -74,60.0,60 -75,114.0,114 -76,200.0,200 -77,199.0,199 -78,200.0,200 -79,200.0,200 -80,200.0,200 -81,200.0,200 -82,200.0,200 -83,200.0,200 -84,200.0,200 -85,200.0,200 -86,200.0,200 -87,200.0,200 -88,200.0,200 -89,200.0,200 -90,200.0,200 -91,200.0,200 -92,200.0,200 -93,200.0,200 -94,200.0,200 -95,200.0,200 -96,200.0,200 -97,200.0,200 -98,200.0,200 -99,200.0,200 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/tb_logs/events.out.tfevents.1679127699.DESKTOP-H34HQIQ.2016.0 b/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/tb_logs/events.out.tfevents.1679127699.DESKTOP-H34HQIQ.2016.0 deleted file mode 100644 index 0905fc999961a6353897b236a0b111aa006d273e..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_20230318-162139/tb_logs/events.out.tfevents.1679127699.DESKTOP-H34HQIQ.2016.0 +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:df11f028f48b8106ff87f12754360e62af378e6795428875376d4cc9c70baca9 -size 40 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/config.yaml b/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/config.yaml deleted file mode 100644 index c7c11e4943aca50494a910ce9146adeeb34aaee4..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/config.yaml +++ /dev/null @@ -1,36 +0,0 @@ -general_cfg: - algo_name: NoisyDQN - device: cpu - env_name: gym - eval_eps: 10 - eval_per_episode: 5 - load_checkpoint: false - load_path: Train_CartPole-v1_NoisyDQN - max_steps: 200 - mode: train - mp_backend: mp - n_workers: 2 - new_step_api: true - render: false - render_mode: human - save_fig: true - seed: 1 - show_fig: false - test_eps: 10 - train_eps: 200 - wrapper: null -algo_cfg: - batch_size: 64 - buffer_size: 100000 - epsilon_decay: 500 - epsilon_end: 0.01 - epsilon_start: 0.95 - gamma: 0.95 - hidden_dim: 256 - lr: 0.0001 - target_update: 4 - tau: 1.0 -env_cfg: - id: CartPole-v1 - new_step_api: true - render_mode: null diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/logs/log.txt b/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/logs/log.txt deleted file mode 100644 index 0012a04afc32f9b02dd787d0b3c12139b314f0e5..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/logs/log.txt +++ /dev/null @@ -1,44 +0,0 @@ -2023-04-13 22:06:39 - r - INFO: - Hyperparameters: -2023-04-13 22:06:39 - r - INFO: - ================================================================================ -2023-04-13 22:06:39 - r - INFO: - Name Value Type -2023-04-13 22:06:39 - r - INFO: - env_name gym -2023-04-13 22:06:39 - r - INFO: - new_step_api 1 -2023-04-13 22:06:39 - r - INFO: - wrapper None -2023-04-13 22:06:39 - r - INFO: - render 0 -2023-04-13 22:06:39 - r - INFO: - render_mode None -2023-04-13 22:06:39 - r - INFO: - algo_name NoisyDQN -2023-04-13 22:06:39 - r - INFO: - mode train -2023-04-13 22:06:39 - r - INFO: - mp_backend mp -2023-04-13 22:06:39 - r - INFO: - seed 1 -2023-04-13 22:06:39 - r - INFO: - device cpu -2023-04-13 22:06:39 - r - INFO: - train_eps 200 -2023-04-13 22:06:39 - r - INFO: - test_eps 10 -2023-04-13 22:06:39 - r - INFO: - eval_eps 10 -2023-04-13 22:06:39 - r - INFO: - eval_per_episode 5 -2023-04-13 22:06:39 - r - INFO: - max_steps 200 -2023-04-13 22:06:39 - r - INFO: - load_checkpoint 0 -2023-04-13 22:06:39 - r - INFO: - load_path Train_CartPole-v1_NoisyDQN -2023-04-13 22:06:39 - r - INFO: - show_fig 0 -2023-04-13 22:06:39 - r - INFO: - save_fig 1 -2023-04-13 22:06:39 - r - INFO: - n_workers 2 -2023-04-13 22:06:39 - r - INFO: - epsilon_start 0.95 -2023-04-13 22:06:39 - r - INFO: - tau 1.0 -2023-04-13 22:06:39 - r - INFO: - epsilon_end 0.01 -2023-04-13 22:06:39 - r - INFO: - epsilon_decay 500 -2023-04-13 22:06:39 - r - INFO: - hidden_dim 256 -2023-04-13 22:06:39 - r - INFO: - gamma 0.95 -2023-04-13 22:06:39 - r - INFO: - lr 0.0001 -2023-04-13 22:06:39 - r - INFO: - buffer_size 100000 -2023-04-13 22:06:39 - r - INFO: - batch_size 64 -2023-04-13 22:06:39 - r - INFO: - target_update 4 -2023-04-13 22:06:39 - r - INFO: - id CartPole-v1 -2023-04-13 22:06:39 - r - INFO: - task_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230413-220639 -2023-04-13 22:06:39 - r - INFO: - res_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230413-220639/results -2023-04-13 22:06:39 - r - INFO: - log_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230413-220639/logs -2023-04-13 22:06:39 - r - INFO: - traj_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230413-220639/traj -2023-04-13 22:06:39 - r - INFO: - video_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230413-220639/videos -2023-04-13 22:06:39 - r - INFO: - ================================================================================ -2023-04-13 22:06:39 - r - INFO: - n_states: 4, n_actions: 2 -2023-04-13 22:06:39 - r - INFO: - Start training! -2023-04-13 22:06:39 - r - INFO: - Env: gym, Algorithm: NoisyDQN, Device: cpu -2023-04-13 22:07:32 - r - INFO: - Finish training! diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/models/checkpoint.pt b/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/models/checkpoint.pt deleted file mode 100644 index ee646c7afec5e202c73770cd5fc016b932f986e6..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/models/checkpoint.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:ab846435c3ac88c2507622e5f1050d4be6bfc94e33845dc5d7de2fac6df2c92f -size 804667 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/results/learning_curve.png b/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/results/learning_curve.png deleted file mode 100644 index 9b9e3adae071ea42b12fffa1d293327af1c652f4..0000000000000000000000000000000000000000 Binary files a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/results/learning_curve.png and /dev/null differ diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/results/res.csv b/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/results/res.csv deleted file mode 100644 index 509ec3519cb0b22651eed902fc76a81985c0b141..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_mp_20230413-220639/results/res.csv +++ /dev/null @@ -1,202 +0,0 @@ -episodes,rewards -0,24.0 -1,18.0 -2,18.0 -3,19.0 -4,27.0 -5,17.0 -6,15.0 -7,13.0 -8,21.0 -9,29.0 -10,16.0 -11,33.0 -12,9.0 -13,13.0 -14,11.0 -15,17.0 -16,10.0 -17,25.0 -18,13.0 -19,19.0 -20,11.0 -21,11.0 -22,10.0 -23,12.0 -24,14.0 -25,11.0 -26,17.0 -27,15.0 -28,10.0 -29,17.0 -30,10.0 -31,11.0 -32,10.0 -33,18.0 -34,12.0 -35,11.0 -36,18.0 -37,13.0 -38,11.0 -39,35.0 -40,9.0 -41,12.0 -42,13.0 -43,9.0 -44,9.0 -45,28.0 -46,10.0 -47,10.0 -48,9.0 -49,10.0 -50,10.0 -51,9.0 -52,11.0 -53,13.0 -54,13.0 -55,14.0 -56,9.0 -57,31.0 -58,64.0 -59,55.0 -60,25.0 -61,56.0 -62,40.0 -63,91.0 -64,39.0 -65,33.0 -66,53.0 -67,55.0 -68,43.0 -69,96.0 -70,50.0 -71,56.0 -72,55.0 -73,50.0 -74,64.0 -75,102.0 -76,63.0 -77,41.0 -78,88.0 -79,69.0 -80,186.0 -81,161.0 -82,106.0 -83,129.0 -84,200.0 -85,200.0 -86,200.0 -87,200.0 -88,200.0 -89,200.0 -90,200.0 -91,200.0 -92,200.0 -93,200.0 -94,200.0 -95,200.0 -96,200.0 -97,200.0 -98,200.0 -99,200.0 -100,200.0 -101,200.0 -102,200.0 -103,200.0 -104,200.0 -105,200.0 -106,200.0 -107,200.0 -108,200.0 -109,200.0 -110,200.0 -111,200.0 -112,200.0 -113,200.0 -114,200.0 -115,200.0 -116,200.0 -117,200.0 -118,200.0 -119,200.0 -120,200.0 -121,200.0 -122,200.0 -123,200.0 -124,200.0 -125,200.0 -126,200.0 -127,200.0 -128,200.0 -129,200.0 -130,200.0 -131,200.0 -132,200.0 -133,200.0 -134,200.0 -135,200.0 -136,200.0 -137,200.0 -138,200.0 -139,200.0 -140,200.0 -141,200.0 -142,200.0 -143,200.0 -144,200.0 -145,200.0 -146,200.0 -147,200.0 -148,200.0 -149,200.0 -150,200.0 -151,200.0 -152,200.0 -153,200.0 -154,200.0 -155,200.0 -156,200.0 -157,200.0 -158,200.0 -159,200.0 -160,200.0 -161,200.0 -162,200.0 -163,200.0 -164,200.0 -165,200.0 -166,200.0 -167,200.0 -168,200.0 -169,200.0 -170,200.0 -171,200.0 -172,200.0 -173,200.0 -174,200.0 -175,200.0 -176,200.0 -177,200.0 -178,200.0 -179,200.0 -180,200.0 -181,200.0 -182,200.0 -183,200.0 -184,200.0 -185,200.0 -186,200.0 -187,200.0 -188,200.0 -189,200.0 -190,200.0 -191,200.0 -192,200.0 -193,200.0 -194,200.0 -195,200.0 -196,200.0 -197,200.0 -198,200.0 -199,200.0 -200,200.0 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/config.yaml b/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/config.yaml deleted file mode 100644 index d29c9bb73e7473ca189ef2725d9366fe76b087d2..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/config.yaml +++ /dev/null @@ -1,36 +0,0 @@ -general_cfg: - algo_name: NoisyDQN - device: cpu - env_name: gym - eval_eps: 10 - eval_per_episode: 5 - load_checkpoint: false - load_path: Train_CartPole-v1_NoisyDQN - max_steps: 200 - mode: train - mp_backend: ray - n_workers: 2 - new_step_api: true - render: false - render_mode: human - save_fig: true - seed: 1 - show_fig: false - test_eps: 10 - train_eps: 220 - wrapper: null -algo_cfg: - batch_size: 64 - buffer_size: 100000 - epsilon_decay: 500 - epsilon_end: 0.01 - epsilon_start: 0.95 - gamma: 0.95 - hidden_dim: 256 - lr: 0.0001 - target_update: 4 - tau: 1.0 -env_cfg: - id: CartPole-v1 - new_step_api: true - render_mode: null diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/logs/log.txt b/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/logs/log.txt deleted file mode 100644 index 6b3da269d53cf665f2b39c0724abf72a91d151aa..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/logs/log.txt +++ /dev/null @@ -1,44 +0,0 @@ -2023-04-14 10:13:51 - r - INFO: - Hyperparameters: -2023-04-14 10:13:51 - r - INFO: - ================================================================================ -2023-04-14 10:13:51 - r - INFO: - Name Value Type -2023-04-14 10:13:51 - r - INFO: - env_name gym -2023-04-14 10:13:51 - r - INFO: - new_step_api 1 -2023-04-14 10:13:51 - r - INFO: - wrapper None -2023-04-14 10:13:51 - r - INFO: - render 0 -2023-04-14 10:13:51 - r - INFO: - render_mode None -2023-04-14 10:13:51 - r - INFO: - algo_name NoisyDQN -2023-04-14 10:13:51 - r - INFO: - mode train -2023-04-14 10:13:51 - r - INFO: - mp_backend ray -2023-04-14 10:13:51 - r - INFO: - seed 1 -2023-04-14 10:13:51 - r - INFO: - device cpu -2023-04-14 10:13:51 - r - INFO: - train_eps 220 -2023-04-14 10:13:51 - r - INFO: - test_eps 10 -2023-04-14 10:13:51 - r - INFO: - eval_eps 10 -2023-04-14 10:13:51 - r - INFO: - eval_per_episode 5 -2023-04-14 10:13:51 - r - INFO: - max_steps 200 -2023-04-14 10:13:51 - r - INFO: - load_checkpoint 0 -2023-04-14 10:13:51 - r - INFO: - load_path Train_CartPole-v1_NoisyDQN -2023-04-14 10:13:51 - r - INFO: - show_fig 0 -2023-04-14 10:13:51 - r - INFO: - save_fig 1 -2023-04-14 10:13:51 - r - INFO: - n_workers 2 -2023-04-14 10:13:51 - r - INFO: - epsilon_start 0.95 -2023-04-14 10:13:51 - r - INFO: - tau 1.0 -2023-04-14 10:13:51 - r - INFO: - epsilon_end 0.01 -2023-04-14 10:13:51 - r - INFO: - epsilon_decay 500 -2023-04-14 10:13:51 - r - INFO: - hidden_dim 256 -2023-04-14 10:13:51 - r - INFO: - gamma 0.95 -2023-04-14 10:13:51 - r - INFO: - lr 0.0001 -2023-04-14 10:13:51 - r - INFO: - buffer_size 100000 -2023-04-14 10:13:51 - r - INFO: - batch_size 64 -2023-04-14 10:13:51 - r - INFO: - target_update 4 -2023-04-14 10:13:51 - r - INFO: - id CartPole-v1 -2023-04-14 10:13:51 - r - INFO: - task_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230414-101351 -2023-04-14 10:13:51 - r - INFO: - res_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230414-101351/results -2023-04-14 10:13:51 - r - INFO: - log_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230414-101351/logs -2023-04-14 10:13:51 - r - INFO: - traj_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230414-101351/traj -2023-04-14 10:13:51 - r - INFO: - video_dir /media/disk/gsc/joyrl-offline/tasks/Train_gym_NoisyDQN_20230414-101351/videos -2023-04-14 10:13:51 - r - INFO: - ================================================================================ -2023-04-14 10:13:54 - r - INFO: - n_states: 4, n_actions: 2 -2023-04-14 10:13:54 - r - INFO: - Start training! -2023-04-14 10:13:54 - r - INFO: - Env: gym, Algorithm: NoisyDQN, Device: cpu -2023-04-14 10:18:26 - r - INFO: - Finish training! diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/models/checkpoint.pt b/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/models/checkpoint.pt deleted file mode 100644 index bd194c325cd70fff6bcfdbd0f6494201e76888ae..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/models/checkpoint.pt +++ /dev/null @@ -1,3 +0,0 @@ -version https://git-lfs.github.com/spec/v1 -oid sha256:d5596bf84dd1a6b891f4a5790c45ae7c9f937bf6471c2218350adb67e6787b2d -size 804667 diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/results/learning_curve.png b/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/results/learning_curve.png deleted file mode 100644 index 2dfd5c93cc214f70ae2cfea6470b44c8d6c347cb..0000000000000000000000000000000000000000 Binary files a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/results/learning_curve.png and /dev/null differ diff --git a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/results/res.csv b/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/results/res.csv deleted file mode 100644 index db5417b7f2c86455779b86188e2aee2581baad15..0000000000000000000000000000000000000000 --- a/CartPole-v1/Train_CartPole-v1_NoisyDQN_ray_20230414-101351/results/res.csv +++ /dev/null @@ -1,221 +0,0 @@ -episodes,rewards -0,18.0 -1,18.0 -2,19.0 -3,28.0 -4,17.0 -5,15.0 -6,13.0 -7,15.0 -8,38.0 -9,31.0 -10,11.0 -11,31.0 -12,10.0 -13,17.0 -14,14.0 -15,13.0 -16,21.0 -17,10.0 -18,10.0 -19,10.0 -20,11.0 -21,13.0 -22,19.0 -23,12.0 -24,13.0 -25,18.0 -26,15.0 -27,13.0 -28,14.0 -29,12.0 -30,11.0 -31,12.0 -32,14.0 -33,9.0 -34,10.0 -35,16.0 -36,13.0 -37,15.0 -38,12.0 -39,11.0 -40,14.0 -41,28.0 -42,16.0 -43,11.0 -44,12.0 -45,11.0 -46,10.0 -47,13.0 -48,10.0 -49,9.0 -50,13.0 -51,11.0 -52,12.0 -53,10.0 -54,9.0 -55,12.0 -56,10.0 -57,15.0 -58,12.0 -59,12.0 -60,9.0 -61,16.0 -62,15.0 -63,16.0 -64,11.0 -65,18.0 -66,14.0 -67,12.0 -68,17.0 -69,13.0 -70,18.0 -71,15.0 -72,19.0 -73,26.0 -74,39.0 -75,28.0 -76,25.0 -77,66.0 -78,24.0 -79,29.0 -80,24.0 -81,25.0 -82,24.0 -83,20.0 -84,46.0 -85,37.0 -86,16.0 -87,24.0 -88,29.0 -89,86.0 -90,128.0 -91,85.0 -92,79.0 -93,58.0 -94,94.0 -95,57.0 -96,53.0 -97,36.0 -98,65.0 -99,64.0 -100,56.0 -101,58.0 -102,200.0 -103,123.0 -104,109.0 -105,67.0 -106,107.0 -107,165.0 -108,200.0 -109,200.0 -110,200.0 -111,170.0 -112,146.0 -113,200.0 -114,200.0 -115,200.0 -116,200.0 -117,200.0 -118,200.0 -119,200.0 -120,200.0 -121,200.0 -122,200.0 -123,200.0 -124,200.0 -125,200.0 -126,200.0 -127,200.0 -128,200.0 -129,200.0 -130,200.0 -131,200.0 -132,200.0 -133,200.0 -134,200.0 -135,200.0 -136,200.0 -137,200.0 -138,200.0 -139,200.0 -140,200.0 -141,200.0 -142,200.0 -143,200.0 -144,200.0 -145,200.0 -146,200.0 -147,200.0 -148,200.0 -149,200.0 -150,200.0 -151,200.0 -152,200.0 -153,200.0 -154,200.0 -155,200.0 -156,200.0 -157,200.0 -158,200.0 -159,191.0 -160,191.0 -161,190.0 -162,192.0 -163,200.0 -164,199.0 -165,200.0 -166,200.0 -167,200.0 -168,200.0 -169,200.0 -170,200.0 -171,200.0 -172,200.0 -173,200.0 -174,200.0 -175,200.0 -176,200.0 -177,200.0 -178,200.0 -179,200.0 -180,200.0 -181,200.0 -182,200.0 -183,200.0 -184,200.0 -185,200.0 -186,200.0 -187,200.0 -188,200.0 -189,200.0 -190,200.0 -191,200.0 -192,200.0 -193,200.0 -194,200.0 -195,200.0 -196,200.0 -197,200.0 -198,200.0 -199,200.0 -200,200.0 -201,200.0 -202,200.0 -203,200.0 -204,200.0 -205,200.0 -206,200.0 -207,200.0 -208,200.0 -209,200.0 -210,200.0 -211,200.0 -212,200.0 -213,200.0 -214,200.0 -215,200.0 -216,200.0 -217,200.0 -218,200.0 -219,200.0 diff --git a/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/config.yaml b/ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/config.yaml similarity index 100% rename from Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/config.yaml rename to ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/config.yaml diff --git a/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/logs/log.txt b/ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/logs/log.txt similarity index 100% rename from Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/logs/log.txt rename to ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/logs/log.txt diff --git a/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/models/checkpoint.pt b/ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/models/checkpoint.pt similarity index 100% rename from Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/models/checkpoint.pt rename to ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/models/checkpoint.pt diff --git a/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/learning_curve.png b/ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/learning_curve.png similarity index 100% rename from Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/learning_curve.png rename to ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/learning_curve.png diff --git a/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/res.csv b/ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/res.csv similarity index 100% rename from Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/res.csv rename to ClassControl/Acrobot-v1/Test_Acrobot-v1_DQN_20221122-120610/results/res.csv diff --git a/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/config.yaml b/ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/config.yaml similarity index 100% rename from Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/config.yaml rename to ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/config.yaml diff --git a/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/logs/log.txt b/ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/logs/log.txt similarity index 100% rename from Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/logs/log.txt rename to ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/logs/log.txt diff --git a/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/models/checkpoint.pt b/ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/models/checkpoint.pt similarity index 100% rename from Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/models/checkpoint.pt rename to ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/models/checkpoint.pt diff --git a/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/learning_curve.png b/ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/learning_curve.png similarity index 100% rename from Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/learning_curve.png rename to ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/learning_curve.png diff --git a/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/res.csv b/ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/res.csv similarity index 100% rename from Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/res.csv rename to ClassControl/Acrobot-v1/Train_Acrobot-v1_DQN_20221122-120436/results/res.csv diff --git a/ClassControl/CartPole-v1/.DS_Store b/ClassControl/CartPole-v1/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..19d4a14a75fe8cdc2ec8ffc28682133766916942 Binary files /dev/null and b/ClassControl/CartPole-v1/.DS_Store differ diff --git a/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/config.yaml b/ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/config.yaml similarity index 100% rename from CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/config.yaml rename to ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/config.yaml diff --git a/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/logs/log.txt b/ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/logs/log.txt similarity index 100% rename from CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/logs/log.txt rename to ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/logs/log.txt diff --git a/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/learning_curve.png b/ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/learning_curve.png similarity index 100% rename from CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/learning_curve.png rename to ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/learning_curve.png diff --git a/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/res.csv b/ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/res.csv similarity index 100% rename from CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/res.csv rename to ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/results/res.csv diff --git a/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/traj/traj.pkl b/ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/traj/traj.pkl similarity index 100% rename from CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/traj/traj.pkl rename to ClassControl/CartPole-v1/Collect_CartPole-v1_PPO_20221206-173222/traj/traj.pkl diff --git a/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/actor_checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/actor_checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/actor_checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/actor_checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/critic_checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/critic_checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/critic_checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/models/critic_checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_A2C_20221204-003659/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/actor_checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/actor_checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/actor_checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/actor_checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/critic_checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/critic_checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/critic_checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/models/critic_checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_A3C_20230111-132929/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_BC_20230319-190943/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_BC_20230319-190943/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/models/model.pth b/ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/models/model.pth similarity index 100% rename from CartPole-v1/Test_CartPole-v1_BC_20230319-190943/models/model.pth rename to ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/models/model.pth diff --git a/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/tb_logs/events.out.tfevents.1679224183.dell-Precision-5820-Tower.15407.0 b/ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/tb_logs/events.out.tfevents.1679224183.dell-Precision-5820-Tower.15407.0 similarity index 100% rename from CartPole-v1/Test_CartPole-v1_BC_20230319-190943/tb_logs/events.out.tfevents.1679224183.dell-Precision-5820-Tower.15407.0 rename to ClassControl/CartPole-v1/Test_CartPole-v1_BC_20230319-190943/tb_logs/events.out.tfevents.1679224183.dell-Precision-5820-Tower.15407.0 diff --git a/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_C51_20230114-222728/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_C51_20230114-222728/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_C51_20230114-222728/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_C51_20230114-222728/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_CQL_20230409-160145/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_DRQN_20230204-223710/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/actor.pth b/ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/actor.pth similarity index 100% rename from CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/actor.pth rename to ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/actor.pth diff --git a/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/critic.pth b/ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/critic.pth similarity index 100% rename from CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/critic.pth rename to ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/models/critic.pth diff --git a/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_GAIL_20221207-163649/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_NoisyDQN_20230318-162630/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/tb_logs/events.out.tfevents.1680275682.DESKTOP-H34HQIQ.290376.0 b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/tb_logs/events.out.tfevents.1680275682.DESKTOP-H34HQIQ.290376.0 similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/tb_logs/events.out.tfevents.1680275682.DESKTOP-H34HQIQ.290376.0 rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/tb_logs/events.out.tfevents.1680275682.DESKTOP-H34HQIQ.290376.0 diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_NoisyDQN_mp_20230413-221012/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_PER_DQN_ray_20230415-220540/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_NoisyDQN_ray_20230414-101926/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_REINFORCE_20221203-143430/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_20230331-231442/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_RainbowDQN_20230114-222446/results/res.csv diff --git a/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/config.yaml b/ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/config.yaml similarity index 100% rename from CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/config.yaml rename to ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/config.yaml diff --git a/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/logs/log.txt b/ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/logs/log.txt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/logs/log.txt rename to ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/logs/log.txt diff --git a/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/models/checkpoint.pt b/ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/models/checkpoint.pt rename to ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/models/checkpoint.pt diff --git a/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/learning_curve.png b/ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/learning_curve.png similarity index 100% rename from CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/learning_curve.png rename to ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/learning_curve.png diff --git a/CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/res.csv b/ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/res.csv similarity index 100% rename from CartPole-v1/Test_CartPole-v1_PER_DQN_mp_20230415-215147/results/res.csv rename to ClassControl/CartPole-v1/Test_CartPole-v1_SAC_D_20230305-113238/results/res.csv diff --git a/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/config.yaml b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/config.yaml similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/config.yaml rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/config.yaml diff --git a/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/logs/log.txt b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/logs/log.txt similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/logs/log.txt rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/logs/log.txt diff --git a/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/results/trajs_0.pkl b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/results/trajs_0.pkl similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/results/trajs_0.pkl rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/results/trajs_0.pkl diff --git a/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/interact/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.0 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/interact/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.0 similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/interact/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.0 rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/interact/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.0 diff --git a/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/model/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.1 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/model/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.1 similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/model/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.1 rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/tb_logs/model/events.out.tfevents.1684156766.DESKTOP-H34HQIQ.16348.1 diff --git a/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/videos/video.gif b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/videos/video.gif similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/videos/video.gif rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DQN_20230515-211926/videos/video.gif diff --git a/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/config.yaml b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/config.yaml similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/config.yaml rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/config.yaml diff --git a/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/logs/log.txt b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/logs/log.txt similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/logs/log.txt rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/logs/log.txt diff --git a/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/interact/events.out.tfevents.1684209185.JMac.local.52313.0 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/interact/events.out.tfevents.1684209185.JMac.local.52313.0 similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/interact/events.out.tfevents.1684209185.JMac.local.52313.0 rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/interact/events.out.tfevents.1684209185.JMac.local.52313.0 diff --git a/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/model/events.out.tfevents.1684209185.JMac.local.52313.1 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/model/events.out.tfevents.1684209185.JMac.local.52313.1 similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/model/events.out.tfevents.1684209185.JMac.local.52313.1 rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_DoubleDQN_20230516-115305/tb_logs/model/events.out.tfevents.1684209185.JMac.local.52313.1 diff --git a/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/config.yaml b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..960b350d3388aeafb57bb6a9f610ccfcb3c519aa --- /dev/null +++ b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/config.yaml @@ -0,0 +1,47 @@ +general_cfg: + algo_name: NoisyDQN + collect_traj: false + device: cpu + env_name: gym + load_checkpoint: true + load_model_step: best + load_path: Train_single_CartPole-v1_NoisyDQN_20230518-133737 + max_episode: 10 + max_step: 200 + mode: test + model_save_fre: 500 + mp_backend: single + n_learners: 1 + n_workers: 2 + online_eval: true + online_eval_episode: 10 + seed: 1 + share_buffer: true +algo_cfg: + batch_size: 64 + buffer_size: 100000 + buffer_type: REPLAY_QUE + epsilon_decay: 500 + epsilon_end: 0.01 + epsilon_start: 0.95 + gamma: 0.99 + lr: 0.0001 + target_update: 4 + value_layers: + - activation: relu + layer_size: + - 256 + layer_type: noisy_linear + std_init: 0.4 + - activation: relu + layer_size: + - 256 + layer_type: noisy_linear + std_init: 0.4 +env_cfg: + id: CartPole-v1 + ignore_params: + - wrapper + - ignore_params + render_mode: null + wrapper: null diff --git a/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/logs/log.txt b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/logs/log.txt new file mode 100644 index 0000000000000000000000000000000000000000..25e2a2849ab6f7ccb66bb0cea27e40f4a148128e --- /dev/null +++ b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/logs/log.txt @@ -0,0 +1,57 @@ +2023-05-18 13:38:24 - SimpleLog - INFO: - General Configs: +2023-05-18 13:38:24 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:38:24 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:38:24 - SimpleLog - INFO: - env_name gym +2023-05-18 13:38:24 - SimpleLog - INFO: - algo_name NoisyDQN +2023-05-18 13:38:24 - SimpleLog - INFO: - mode test +2023-05-18 13:38:24 - SimpleLog - INFO: - device cpu +2023-05-18 13:38:24 - SimpleLog - INFO: - seed 1 +2023-05-18 13:38:24 - SimpleLog - INFO: - max_episode 10 +2023-05-18 13:38:24 - SimpleLog - INFO: - max_step 200 +2023-05-18 13:38:24 - SimpleLog - INFO: - collect_traj 0 +2023-05-18 13:38:24 - SimpleLog - INFO: - mp_backend single +2023-05-18 13:38:24 - SimpleLog - INFO: - n_workers 2 +2023-05-18 13:38:24 - SimpleLog - INFO: - n_learners 1 +2023-05-18 13:38:24 - SimpleLog - INFO: - share_buffer 1 +2023-05-18 13:38:24 - SimpleLog - INFO: - online_eval 1 +2023-05-18 13:38:24 - SimpleLog - INFO: - online_eval_episode 10 +2023-05-18 13:38:24 - SimpleLog - INFO: - model_save_fre 500 +2023-05-18 13:38:24 - SimpleLog - INFO: - load_checkpoint 1 +2023-05-18 13:38:24 - SimpleLog - INFO: - load_path Train_single_CartPole-v1_NoisyDQN_20230518-133737 +2023-05-18 13:38:24 - SimpleLog - INFO: - load_model_step best +2023-05-18 13:38:24 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:38:24 - SimpleLog - INFO: - Algo Configs: +2023-05-18 13:38:24 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:38:24 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:38:24 - SimpleLog - INFO: - epsilon_start 0.95 +2023-05-18 13:38:24 - SimpleLog - INFO: - epsilon_end 0.01 +2023-05-18 13:38:24 - SimpleLog - INFO: - epsilon_decay 500 +2023-05-18 13:38:24 - SimpleLog - INFO: - gamma 0.99 +2023-05-18 13:38:24 - SimpleLog - INFO: - lr 0.0001 +2023-05-18 13:38:24 - SimpleLog - INFO: - buffer_size 100000 +2023-05-18 13:38:24 - SimpleLog - INFO: - batch_size 64 +2023-05-18 13:38:24 - SimpleLog - INFO: - target_update 4 +2023-05-18 13:38:24 - SimpleLog - INFO: - value_layers [{'layer_type': 'noisy_linear', 'layer_size': [256], 'activation': 'relu', 'std_init': 0.4}, {'layer_type': 'noisy_linear', 'layer_size': [256], 'activation': 'relu', 'std_init': 0.4}] +2023-05-18 13:38:24 - SimpleLog - INFO: - buffer_type REPLAY_QUE +2023-05-18 13:38:24 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:38:24 - SimpleLog - INFO: - Env Configs: +2023-05-18 13:38:24 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:38:24 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:38:24 - SimpleLog - INFO: - id CartPole-v1 +2023-05-18 13:38:24 - SimpleLog - INFO: - render_mode None +2023-05-18 13:38:24 - SimpleLog - INFO: - wrapper None +2023-05-18 13:38:24 - SimpleLog - INFO: - ignore_params ['wrapper', 'ignore_params'] +2023-05-18 13:38:24 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:38:24 - SimpleLog - INFO: - obs_space: Box([-4.8000002e+00 -3.4028235e+38 -4.1887903e-01 -3.4028235e+38], [4.8000002e+00 3.4028235e+38 4.1887903e-01 3.4028235e+38], (4,), float32), n_actions: Discrete(2) +2023-05-18 13:38:24 - SimpleLog - INFO: - Start testing! +2023-05-18 13:38:24 - SimpleLog - INFO: - episode: 0, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:24 - SimpleLog - INFO: - episode: 1, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:24 - SimpleLog - INFO: - episode: 2, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:24 - SimpleLog - INFO: - episode: 3, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:24 - SimpleLog - INFO: - episode: 4, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:25 - SimpleLog - INFO: - episode: 5, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:25 - SimpleLog - INFO: - episode: 6, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:25 - SimpleLog - INFO: - episode: 7, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:25 - SimpleLog - INFO: - episode: 8, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:25 - SimpleLog - INFO: - episode: 9, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:38:25 - SimpleLog - INFO: - Finish testing! total time consumed: 0.26s diff --git a/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/tb_logs/interact/events.out.tfevents.1684388304.JMac.local.86491.0 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/tb_logs/interact/events.out.tfevents.1684388304.JMac.local.86491.0 new file mode 100644 index 0000000000000000000000000000000000000000..f86a02769b3b3d06635d5a78555496f79857f0d6 --- /dev/null +++ b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/tb_logs/interact/events.out.tfevents.1684388304.JMac.local.86491.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a888c1468be41447e5aec55b8e1cac6bb28792c9a6d11eb37f43f8db1a1ec315 +size 1056 diff --git a/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/tb_logs/model/events.out.tfevents.1684388304.JMac.local.86491.1 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/tb_logs/model/events.out.tfevents.1684388304.JMac.local.86491.1 new file mode 100644 index 0000000000000000000000000000000000000000..c48f7fbcf9258a8ac94085c3de6ebdabfd11050a --- /dev/null +++ b/ClassControl/CartPole-v1/Test_single_CartPole-v1_NoisyDQN_20230518-133824/tb_logs/model/events.out.tfevents.1684388304.JMac.local.86491.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5ef74ab61b4fd87898bdb34cad1df3bbf05d7edf30ae81504f7d09bb4f75ffd +size 40 diff --git a/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/config.yaml b/ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/config.yaml similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/config.yaml rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/config.yaml diff --git a/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/logs/log.txt b/ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/logs/log.txt similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/logs/log.txt rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/logs/log.txt diff --git a/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/interact/events.out.tfevents.1684302533.JMac.local.61381.0 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/interact/events.out.tfevents.1684302533.JMac.local.61381.0 similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/interact/events.out.tfevents.1684302533.JMac.local.61381.0 rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/interact/events.out.tfevents.1684302533.JMac.local.61381.0 diff --git a/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/model/events.out.tfevents.1684302533.JMac.local.61381.1 b/ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/model/events.out.tfevents.1684302533.JMac.local.61381.1 similarity index 100% rename from CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/model/events.out.tfevents.1684302533.JMac.local.61381.1 rename to ClassControl/CartPole-v1/Test_single_CartPole-v1_PPO_20230517-134853/tb_logs/model/events.out.tfevents.1684302533.JMac.local.61381.1 diff --git a/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/actor_checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/actor_checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/actor_checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/actor_checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/critic_checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/critic_checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/critic_checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/models/critic_checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_A2C_20221204-003439/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/actor_checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/actor_checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/actor_checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/actor_checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/critic_checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/critic_checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/critic_checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/models/critic_checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_A3C_20230111-132542/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_BC_20230319-190431/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_BC_20230319-190431/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/models/model.pth b/ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/models/model.pth similarity index 100% rename from CartPole-v1/Train_CartPole-v1_BC_20230319-190431/models/model.pth rename to ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/models/model.pth diff --git a/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/tb_logs/events.out.tfevents.1679223871.dell-Precision-5820-Tower.11356.0 b/ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/tb_logs/events.out.tfevents.1679223871.dell-Precision-5820-Tower.11356.0 similarity index 100% rename from CartPole-v1/Train_CartPole-v1_BC_20230319-190431/tb_logs/events.out.tfevents.1679223871.dell-Precision-5820-Tower.11356.0 rename to ClassControl/CartPole-v1/Train_CartPole-v1_BC_20230319-190431/tb_logs/events.out.tfevents.1679223871.dell-Precision-5820-Tower.11356.0 diff --git a/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_C51_20230114-222523/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_C51_20230114-222523/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_C51_20230114-222523/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_C51_20230114-222523/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_CQL_20230408-183652/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_DRQN_20230204-223146/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/actor.pth b/ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/actor.pth similarity index 100% rename from CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/actor.pth rename to ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/actor.pth diff --git a/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/critic.pth b/ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/critic.pth similarity index 100% rename from CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/critic.pth rename to ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/models/critic.pth diff --git a/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_GAIL_20221207-160945/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/tb_logs/events.out.tfevents.1680277069.DESKTOP-H34HQIQ.305216.0 b/ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/tb_logs/events.out.tfevents.1680277069.DESKTOP-H34HQIQ.305216.0 similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/tb_logs/events.out.tfevents.1680277069.DESKTOP-H34HQIQ.305216.0 rename to ClassControl/CartPole-v1/Train_CartPole-v1_PERQue_DQN_20230331-233749/tb_logs/events.out.tfevents.1680277069.DESKTOP-H34HQIQ.305216.0 diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/tb_logs/events.out.tfevents.1680274695.DESKTOP-H34HQIQ.317208.0 b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/tb_logs/events.out.tfevents.1680274695.DESKTOP-H34HQIQ.317208.0 similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/tb_logs/events.out.tfevents.1680274695.DESKTOP-H34HQIQ.317208.0 rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_20230331-225815/tb_logs/events.out.tfevents.1680274695.DESKTOP-H34HQIQ.317208.0 diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_mp__20230415-215002/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_PER_DQN_ray_20230415-215738/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/actor.pth b/ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/actor.pth similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/actor.pth rename to ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/actor.pth diff --git a/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/critic.pth b/ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/critic.pth similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/critic.pth rename to ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/models/critic.pth diff --git a/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_PPO-KL_20221217-204003/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_REINFORCE_20221203-143307/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_RainbowDQN_20230114-222012/results/res.csv diff --git a/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/config.yaml b/ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/config.yaml similarity index 100% rename from CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/config.yaml rename to ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/config.yaml diff --git a/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/logs/log.txt b/ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/logs/log.txt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/logs/log.txt rename to ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/logs/log.txt diff --git a/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/models/checkpoint.pt b/ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/models/checkpoint.pt similarity index 100% rename from CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/models/checkpoint.pt rename to ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/models/checkpoint.pt diff --git a/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/learning_curve.png b/ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/learning_curve.png similarity index 100% rename from CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/learning_curve.png rename to ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/learning_curve.png diff --git a/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/res.csv b/ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/res.csv similarity index 100% rename from CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/res.csv rename to ClassControl/CartPole-v1/Train_CartPole-v1_SAC_D_20230305-112849/results/res.csv diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/config.yaml b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/config.yaml similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/config.yaml rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/config.yaml diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/logs/log.txt b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/logs/log.txt similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/logs/log.txt rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/logs/log.txt diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/1500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/2500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/3500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/4500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/5500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/6500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/7000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/7000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/7000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/7000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/best b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/best similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/best rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/models/best diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.0 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.0 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.0 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.0 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.0 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/interact/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.0 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.1 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.1 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160356.DESKTOP-H34HQIQ.63896.1 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.1 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.1 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DQN_20230515-221916/tb_logs/model/events.out.tfevents.1684160363.DESKTOP-H34HQIQ.19952.1 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/config.yaml b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/config.yaml similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/config.yaml rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/config.yaml diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/logs/log.txt b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/logs/log.txt similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/logs/log.txt rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/logs/log.txt diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/1500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/2500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/3500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/best b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/best similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/best rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/models/best diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209086.JMac.local.52110.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209086.JMac.local.52110.0 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209086.JMac.local.52110.0 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209086.JMac.local.52110.0 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209096.JMac.local.52161.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209096.JMac.local.52161.0 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209096.JMac.local.52161.0 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/interact/events.out.tfevents.1684209096.JMac.local.52161.0 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209086.JMac.local.52110.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209086.JMac.local.52110.1 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209086.JMac.local.52110.1 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209086.JMac.local.52110.1 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209096.JMac.local.52161.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209096.JMac.local.52161.1 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209096.JMac.local.52161.1 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DoubleDQN_20230516-115126/tb_logs/model/events.out.tfevents.1684209096.JMac.local.52161.1 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/config.yaml b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/config.yaml similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/config.yaml rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/config.yaml diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/logs/log.txt b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/logs/log.txt similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/logs/log.txt rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/logs/log.txt diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/10500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/1500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/2500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/3500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/4500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/5500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/6500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/7500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/8500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9000 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9000 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9000 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9500 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9500 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/9500 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/best b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/best similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/best rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/models/best diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.0 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.0 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.0 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.0 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.0 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/interact/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.0 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.1 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.1 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334489.DESKTOP-H34HQIQ.80856.1 diff --git a/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.1 similarity index 100% rename from CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.1 rename to ClassControl/CartPole-v1/Train_ray_CartPole-v1_DuelingDQN_20230517-224129/tb_logs/model/events.out.tfevents.1684334497.DESKTOP-H34HQIQ.84100.1 diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/.DS_Store b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/.DS_Store new file mode 100644 index 0000000000000000000000000000000000000000..b8ede2ae7112d7ae2b38866a49526a0dd67f83de Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/.DS_Store differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/config.yaml b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..29eed4a9435ccc53d4b62240273577f56250a92d --- /dev/null +++ b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/config.yaml @@ -0,0 +1,47 @@ +general_cfg: + algo_name: NoisyDQN + collect_traj: false + device: cpu + env_name: gym + load_checkpoint: false + load_model_step: best + load_path: Train_single_CartPole-v1_NoisyDQN_20230518-133737 + max_episode: 100 + max_step: 200 + mode: train + model_save_fre: 500 + mp_backend: ray + n_learners: 1 + n_workers: 2 + online_eval: true + online_eval_episode: 10 + seed: 1 + share_buffer: true +algo_cfg: + batch_size: 64 + buffer_size: 100000 + buffer_type: REPLAY_QUE + epsilon_decay: 500 + epsilon_end: 0.01 + epsilon_start: 0.95 + gamma: 0.99 + lr: 0.0001 + target_update: 4 + value_layers: + - activation: relu + layer_size: + - 256 + layer_type: noisy_linear + std_init: 0.4 + - activation: relu + layer_size: + - 256 + layer_type: noisy_linear + std_init: 0.4 +env_cfg: + id: CartPole-v1 + ignore_params: + - wrapper + - ignore_params + render_mode: null + wrapper: null diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/logs/log.txt b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/logs/log.txt new file mode 100644 index 0000000000000000000000000000000000000000..f273aaccf27603d3b2207b8e4e9b79b3d5f6be55 --- /dev/null +++ b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/logs/log.txt @@ -0,0 +1,168 @@ +2023-05-18 13:39:47 - SimpleLog - INFO: - General Configs: +2023-05-18 13:39:47 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:39:47 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:39:47 - SimpleLog - INFO: - env_name gym +2023-05-18 13:39:47 - SimpleLog - INFO: - algo_name NoisyDQN +2023-05-18 13:39:47 - SimpleLog - INFO: - mode train +2023-05-18 13:39:47 - SimpleLog - INFO: - device cpu +2023-05-18 13:39:47 - SimpleLog - INFO: - seed 1 +2023-05-18 13:39:47 - SimpleLog - INFO: - max_episode 100 +2023-05-18 13:39:47 - SimpleLog - INFO: - max_step 200 +2023-05-18 13:39:47 - SimpleLog - INFO: - collect_traj 0 +2023-05-18 13:39:47 - SimpleLog - INFO: - mp_backend ray +2023-05-18 13:39:47 - SimpleLog - INFO: - n_workers 2 +2023-05-18 13:39:47 - SimpleLog - INFO: - n_learners 1 +2023-05-18 13:39:47 - SimpleLog - INFO: - share_buffer 1 +2023-05-18 13:39:47 - SimpleLog - INFO: - online_eval 1 +2023-05-18 13:39:47 - SimpleLog - INFO: - online_eval_episode 10 +2023-05-18 13:39:47 - SimpleLog - INFO: - model_save_fre 500 +2023-05-18 13:39:47 - SimpleLog - INFO: - load_checkpoint 0 +2023-05-18 13:39:47 - SimpleLog - INFO: - load_path Train_single_CartPole-v1_NoisyDQN_20230518-133737 +2023-05-18 13:39:47 - SimpleLog - INFO: - load_model_step best +2023-05-18 13:39:47 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:39:47 - SimpleLog - INFO: - Algo Configs: +2023-05-18 13:39:47 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:39:47 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:39:47 - SimpleLog - INFO: - epsilon_start 0.95 +2023-05-18 13:39:47 - SimpleLog - INFO: - epsilon_end 0.01 +2023-05-18 13:39:47 - SimpleLog - INFO: - epsilon_decay 500 +2023-05-18 13:39:47 - SimpleLog - INFO: - gamma 0.99 +2023-05-18 13:39:47 - SimpleLog - INFO: - lr 0.0001 +2023-05-18 13:39:47 - SimpleLog - INFO: - buffer_size 100000 +2023-05-18 13:39:47 - SimpleLog - INFO: - batch_size 64 +2023-05-18 13:39:47 - SimpleLog - INFO: - target_update 4 +2023-05-18 13:39:47 - SimpleLog - INFO: - value_layers [{'layer_type': 'noisy_linear', 'layer_size': [256], 'activation': 'relu', 'std_init': 0.4}, {'layer_type': 'noisy_linear', 'layer_size': [256], 'activation': 'relu', 'std_init': 0.4}] +2023-05-18 13:39:47 - SimpleLog - INFO: - buffer_type REPLAY_QUE +2023-05-18 13:39:47 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:39:47 - SimpleLog - INFO: - Env Configs: +2023-05-18 13:39:47 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:39:47 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:39:47 - SimpleLog - INFO: - id CartPole-v1 +2023-05-18 13:39:47 - SimpleLog - INFO: - render_mode None +2023-05-18 13:39:47 - SimpleLog - INFO: - wrapper None +2023-05-18 13:39:47 - SimpleLog - INFO: - ignore_params ['wrapper', 'ignore_params'] +2023-05-18 13:39:47 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:39:54 - SimpleLog - INFO: - obs_space: Box([-4.8000002e+00 -3.4028235e+38 -4.1887903e-01 -3.4028235e+38], [4.8000002e+00 3.4028235e+38 4.1887903e-01 3.4028235e+38], (4,), float32), n_actions: Discrete(2) +2023-05-18 13:39:59 - RayLog - INFO: - Worker 0 finished episode 0 with reward 14.0 in 14 steps +2023-05-18 13:39:59 - RayLog - INFO: - Worker 1 finished episode 0 with reward 22.0 in 22 steps +2023-05-18 13:40:01 - RayLog - INFO: - Worker 1 finished episode 2 with reward 33.0 in 33 steps +2023-05-18 13:40:01 - RayLog - INFO: - Worker 0 finished episode 2 with reward 38.0 in 38 steps +2023-05-18 13:40:01 - RayLog - INFO: - Worker 0 finished episode 4 with reward 15.0 in 15 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 0 finished episode 5 with reward 26.0 in 26 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 1 finished episode 3 with reward 53.0 in 53 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 0 finished episode 6 with reward 11.0 in 11 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 1 finished episode 7 with reward 12.0 in 12 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 0 finished episode 8 with reward 14.0 in 14 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 1 finished episode 9 with reward 13.0 in 13 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 0 finished episode 10 with reward 12.0 in 12 steps +2023-05-18 13:40:02 - RayLog - INFO: - Worker 1 finished episode 11 with reward 10.0 in 10 steps +2023-05-18 13:40:03 - RayLog - INFO: - Worker 0 finished episode 12 with reward 9.0 in 9 steps +2023-05-18 13:40:03 - RayLog - INFO: - Worker 1 finished episode 13 with reward 12.0 in 12 steps +2023-05-18 13:40:03 - RayLog - INFO: - Worker 0 finished episode 14 with reward 11.0 in 11 steps +2023-05-18 13:40:03 - RayLog - INFO: - Worker 1 finished episode 15 with reward 11.0 in 11 steps +2023-05-18 13:40:03 - RayLog - INFO: - Worker 0 finished episode 16 with reward 9.0 in 9 steps +2023-05-18 13:40:03 - RayLog - INFO: - Worker 1 finished episode 17 with reward 20.0 in 20 steps +2023-05-18 13:40:03 - RayLog - INFO: - Worker 0 finished episode 18 with reward 20.0 in 20 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 0 finished episode 20 with reward 12.0 in 12 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 0 finished episode 21 with reward 13.0 in 13 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 1 finished episode 19 with reward 31.0 in 31 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 0 finished episode 22 with reward 10.0 in 10 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 1 finished episode 23 with reward 9.0 in 9 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 0 finished episode 24 with reward 12.0 in 12 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 1 finished episode 25 with reward 11.0 in 11 steps +2023-05-18 13:40:04 - RayLog - INFO: - Worker 0 finished episode 26 with reward 12.0 in 12 steps +2023-05-18 13:40:05 - RayLog - INFO: - Worker 1 finished episode 27 with reward 12.0 in 12 steps +2023-05-18 13:40:05 - RayLog - INFO: - Worker 0 finished episode 28 with reward 13.0 in 13 steps +2023-05-18 13:40:05 - RayLog - INFO: - Worker 1 finished episode 29 with reward 13.0 in 13 steps +2023-05-18 13:40:05 - RayLog - INFO: - Worker 0 finished episode 30 with reward 12.0 in 12 steps +2023-05-18 13:40:05 - RayLog - INFO: - Worker 1 finished episode 31 with reward 14.0 in 14 steps +2023-05-18 13:40:05 - RayLog - INFO: - Worker 0 finished episode 32 with reward 14.0 in 14 steps +2023-05-18 13:40:07 - RayLog - INFO: - learner id: 0, update_step: 500, online_eval_reward: 10.000 +2023-05-18 13:40:07 - RayLog - INFO: - learner 0 for current update step obtain a better online_eval_reward: 10.000, save the best model! +2023-05-18 13:40:07 - RayLog - INFO: - Worker 1 finished episode 33 with reward 14.0 in 14 steps +2023-05-18 13:40:07 - RayLog - INFO: - Worker 0 finished episode 34 with reward 11.0 in 11 steps +2023-05-18 13:40:07 - RayLog - INFO: - Worker 1 finished episode 35 with reward 13.0 in 13 steps +2023-05-18 13:40:07 - RayLog - INFO: - Worker 1 finished episode 37 with reward 10.0 in 10 steps +2023-05-18 13:40:07 - RayLog - INFO: - Worker 1 finished episode 38 with reward 11.0 in 11 steps +2023-05-18 13:40:07 - RayLog - INFO: - Worker 0 finished episode 36 with reward 29.0 in 29 steps +2023-05-18 13:40:08 - RayLog - INFO: - Worker 1 finished episode 39 with reward 9.0 in 9 steps +2023-05-18 13:40:08 - RayLog - INFO: - Worker 0 finished episode 40 with reward 11.0 in 11 steps +2023-05-18 13:40:08 - RayLog - INFO: - Worker 0 finished episode 42 with reward 35.0 in 35 steps +2023-05-18 13:40:08 - RayLog - INFO: - Worker 1 finished episode 41 with reward 49.0 in 49 steps +2023-05-18 13:40:09 - RayLog - INFO: - Worker 0 finished episode 43 with reward 36.0 in 36 steps +2023-05-18 13:40:09 - RayLog - INFO: - Worker 1 finished episode 44 with reward 35.0 in 35 steps +2023-05-18 13:40:10 - RayLog - INFO: - Worker 0 finished episode 45 with reward 42.0 in 42 steps +2023-05-18 13:40:10 - RayLog - INFO: - Worker 1 finished episode 46 with reward 44.0 in 44 steps +2023-05-18 13:40:10 - RayLog - INFO: - Worker 0 finished episode 47 with reward 36.0 in 36 steps +2023-05-18 13:40:11 - RayLog - INFO: - Worker 1 finished episode 48 with reward 44.0 in 44 steps +2023-05-18 13:40:11 - RayLog - INFO: - Worker 0 finished episode 49 with reward 37.0 in 37 steps +2023-05-18 13:40:12 - RayLog - INFO: - learner id: 0, update_step: 1000, online_eval_reward: 51.000 +2023-05-18 13:40:12 - RayLog - INFO: - learner 0 for current update step obtain a better online_eval_reward: 51.000, save the best model! +2023-05-18 13:40:13 - RayLog - INFO: - Worker 0 finished episode 51 with reward 76.0 in 76 steps +2023-05-18 13:40:13 - RayLog - INFO: - Worker 1 finished episode 50 with reward 109.0 in 109 steps +2023-05-18 13:40:15 - RayLog - INFO: - Worker 0 finished episode 52 with reward 119.0 in 119 steps +2023-05-18 13:40:15 - RayLog - INFO: - Worker 1 finished episode 53 with reward 120.0 in 120 steps +2023-05-18 13:40:16 - RayLog - INFO: - Worker 0 finished episode 54 with reward 57.0 in 57 steps +2023-05-18 13:40:16 - RayLog - INFO: - Worker 1 finished episode 55 with reward 44.0 in 44 steps +2023-05-18 13:40:16 - RayLog - INFO: - learner id: 0, update_step: 1500, online_eval_reward: 53.000 +2023-05-18 13:40:16 - RayLog - INFO: - learner 0 for current update step obtain a better online_eval_reward: 53.000, save the best model! +2023-05-18 13:40:17 - RayLog - INFO: - Worker 1 finished episode 57 with reward 43.0 in 43 steps +2023-05-18 13:40:18 - RayLog - INFO: - Worker 0 finished episode 56 with reward 72.0 in 72 steps +2023-05-18 13:40:18 - RayLog - INFO: - Worker 1 finished episode 58 with reward 35.0 in 35 steps +2023-05-18 13:40:19 - RayLog - INFO: - Worker 1 finished episode 60 with reward 48.0 in 48 steps +2023-05-18 13:40:19 - RayLog - INFO: - Worker 0 finished episode 59 with reward 64.0 in 64 steps +2023-05-18 13:40:19 - RayLog - INFO: - Worker 1 finished episode 61 with reward 36.0 in 36 steps +2023-05-18 13:40:20 - RayLog - INFO: - Worker 0 finished episode 62 with reward 57.0 in 57 steps +2023-05-18 13:40:20 - RayLog - INFO: - Worker 1 finished episode 63 with reward 42.0 in 42 steps +2023-05-18 13:40:21 - RayLog - INFO: - learner id: 0, update_step: 2000, online_eval_reward: 143.000 +2023-05-18 13:40:21 - RayLog - INFO: - learner 0 for current update step obtain a better online_eval_reward: 143.000, save the best model! +2023-05-18 13:40:23 - RayLog - INFO: - Worker 1 finished episode 65 with reward 100.0 in 100 steps +2023-05-18 13:40:23 - RayLog - INFO: - Worker 0 finished episode 64 with reward 153.0 in 153 steps +2023-05-18 13:40:24 - RayLog - INFO: - Worker 1 finished episode 66 with reward 61.0 in 61 steps +2023-05-18 13:40:25 - RayLog - INFO: - Worker 0 finished episode 67 with reward 111.0 in 111 steps +2023-05-18 13:40:26 - RayLog - INFO: - Worker 1 finished episode 68 with reward 103.0 in 103 steps +2023-05-18 13:40:27 - RayLog - INFO: - learner id: 0, update_step: 2500, online_eval_reward: 85.000 +2023-05-18 13:40:28 - RayLog - INFO: - Worker 1 finished episode 70 with reward 127.0 in 127 steps +2023-05-18 13:40:29 - RayLog - INFO: - Worker 0 finished episode 69 with reward 164.0 in 164 steps +2023-05-18 13:40:32 - RayLog - INFO: - learner id: 0, update_step: 3000, online_eval_reward: 74.000 +2023-05-18 13:40:32 - RayLog - INFO: - Worker 1 finished episode 71 with reward 200.0 in 200 steps +2023-05-18 13:40:32 - RayLog - INFO: - Worker 0 finished episode 72 with reward 186.0 in 186 steps +2023-05-18 13:40:35 - RayLog - INFO: - Worker 1 finished episode 73 with reward 114.0 in 114 steps +2023-05-18 13:40:35 - RayLog - INFO: - Worker 0 finished episode 74 with reward 109.0 in 109 steps +2023-05-18 13:40:36 - RayLog - INFO: - Worker 1 finished episode 75 with reward 72.0 in 72 steps +2023-05-18 13:40:37 - RayLog - INFO: - learner id: 0, update_step: 3500, online_eval_reward: 83.000 +2023-05-18 13:40:37 - RayLog - INFO: - Worker 0 finished episode 76 with reward 96.0 in 96 steps +2023-05-18 13:40:37 - RayLog - INFO: - Worker 1 finished episode 77 with reward 62.0 in 62 steps +2023-05-18 13:40:38 - RayLog - INFO: - Worker 0 finished episode 78 with reward 88.0 in 88 steps +2023-05-18 13:40:39 - RayLog - INFO: - Worker 1 finished episode 79 with reward 70.0 in 70 steps +2023-05-18 13:40:40 - RayLog - INFO: - Worker 1 finished episode 81 with reward 77.0 in 77 steps +2023-05-18 13:40:42 - RayLog - INFO: - learner id: 0, update_step: 4000, online_eval_reward: 123.000 +2023-05-18 13:40:42 - RayLog - INFO: - Worker 0 finished episode 80 with reward 181.0 in 181 steps +2023-05-18 13:40:42 - RayLog - INFO: - Worker 1 finished episode 82 with reward 105.0 in 105 steps +2023-05-18 13:40:46 - RayLog - INFO: - Worker 0 finished episode 83 with reward 200.0 in 200 steps +2023-05-18 13:40:47 - RayLog - INFO: - Worker 1 finished episode 84 with reward 200.0 in 200 steps +2023-05-18 13:40:47 - RayLog - INFO: - learner id: 0, update_step: 4500, online_eval_reward: 200.000 +2023-05-18 13:40:47 - RayLog - INFO: - learner 0 for current update step obtain a better online_eval_reward: 200.000, save the best model! +2023-05-18 13:40:51 - RayLog - INFO: - Worker 0 finished episode 85 with reward 200.0 in 200 steps +2023-05-18 13:40:51 - RayLog - INFO: - Worker 1 finished episode 86 with reward 200.0 in 200 steps +2023-05-18 13:40:53 - RayLog - INFO: - learner id: 0, update_step: 5000, online_eval_reward: 200.000 +2023-05-18 13:40:56 - RayLog - INFO: - Worker 0 finished episode 87 with reward 200.0 in 200 steps +2023-05-18 13:40:56 - RayLog - INFO: - Worker 1 finished episode 88 with reward 200.0 in 200 steps +2023-05-18 13:40:59 - RayLog - INFO: - learner id: 0, update_step: 5500, online_eval_reward: 200.000 +2023-05-18 13:41:00 - RayLog - INFO: - Worker 0 finished episode 89 with reward 200.0 in 200 steps +2023-05-18 13:41:01 - RayLog - INFO: - Worker 1 finished episode 90 with reward 200.0 in 200 steps +2023-05-18 13:41:05 - RayLog - INFO: - learner id: 0, update_step: 6000, online_eval_reward: 200.000 +2023-05-18 13:41:05 - RayLog - INFO: - Worker 0 finished episode 91 with reward 200.0 in 200 steps +2023-05-18 13:41:05 - RayLog - INFO: - Worker 1 finished episode 92 with reward 200.0 in 200 steps +2023-05-18 13:41:10 - RayLog - INFO: - Worker 0 finished episode 93 with reward 200.0 in 200 steps +2023-05-18 13:41:10 - RayLog - INFO: - Worker 1 finished episode 94 with reward 200.0 in 200 steps +2023-05-18 13:41:11 - RayLog - INFO: - learner id: 0, update_step: 6500, online_eval_reward: 200.000 +2023-05-18 13:41:15 - RayLog - INFO: - Worker 0 finished episode 95 with reward 200.0 in 200 steps +2023-05-18 13:41:15 - RayLog - INFO: - Worker 1 finished episode 96 with reward 200.0 in 200 steps +2023-05-18 13:41:17 - RayLog - INFO: - learner id: 0, update_step: 7000, online_eval_reward: 200.000 +2023-05-18 13:41:19 - RayLog - INFO: - Worker 0 finished episode 97 with reward 200.0 in 200 steps +2023-05-18 13:41:20 - RayLog - INFO: - Worker 1 finished episode 98 with reward 200.0 in 200 steps +2023-05-18 13:41:23 - RayLog - INFO: - learner id: 0, update_step: 7500, online_eval_reward: 200.000 +2023-05-18 13:41:24 - RayLog - INFO: - Worker 0 finished episode 99 with reward 200.0 in 200 steps +2023-05-18 13:41:25 - RayLog - INFO: - Worker 1 finished episode 100 with reward 200.0 in 200 steps +2023-05-18 13:41:28 - SimpleLog - INFO: - Finish training! total time consumed: 100.97s diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/1000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/1000 new file mode 100644 index 0000000000000000000000000000000000000000..74e47feb7a24f50f810c9b7363b233a0326da957 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/1000 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/1500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/1500 new file mode 100644 index 0000000000000000000000000000000000000000..fcf4f1cf8b15576174682078fd929fa9628c2277 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/1500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/2000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/2000 new file mode 100644 index 0000000000000000000000000000000000000000..755a1c7fc9df14aabede89b4b2171730cf295f57 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/2000 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/2500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/2500 new file mode 100644 index 0000000000000000000000000000000000000000..07c910744feaf07798eb1b9b339ce3db6f4e93ed Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/2500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/3000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/3000 new file mode 100644 index 0000000000000000000000000000000000000000..c61013298531435a056aa82fbc2bb40800b44d11 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/3000 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/3500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/3500 new file mode 100644 index 0000000000000000000000000000000000000000..926cce05ffbc708cece3a7ee1008c30e48cebfa4 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/3500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/4000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/4000 new file mode 100644 index 0000000000000000000000000000000000000000..c9d0dc07fd37a07376b4c3d877a5b2ca5c87b6e3 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/4000 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/4500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/4500 new file mode 100644 index 0000000000000000000000000000000000000000..d94502e1889c18e29b2b3b1509a4e7b5e5098672 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/4500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/500 new file mode 100644 index 0000000000000000000000000000000000000000..ed38cb30fe096739b7aa71a21df31b3fbe19bd27 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/5000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/5000 new file mode 100644 index 0000000000000000000000000000000000000000..0215111a35a49a2f7400916d4720e49b9eea3762 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/5000 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/5500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/5500 new file mode 100644 index 0000000000000000000000000000000000000000..cf0237614550d25362fb619aea38e07ede55f475 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/5500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/6000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/6000 new file mode 100644 index 0000000000000000000000000000000000000000..65293febc436b6c2c02014283eafa5e81457fb83 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/6000 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/6500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/6500 new file mode 100644 index 0000000000000000000000000000000000000000..8010d65fd82b91227765a96f36cf5cbcd75e2709 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/6500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/7000 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/7000 new file mode 100644 index 0000000000000000000000000000000000000000..e4705b62089b56812d3c2633544c58f22756bc4a Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/7000 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/7500 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/7500 new file mode 100644 index 0000000000000000000000000000000000000000..b6b6156fea87497141abc96e14ca4176af8b9130 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/7500 differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/best b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/best new file mode 100644 index 0000000000000000000000000000000000000000..d94502e1889c18e29b2b3b1509a4e7b5e5098672 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/models/best differ diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/interact/events.out.tfevents.1684388387.JMac.local.86757.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/interact/events.out.tfevents.1684388387.JMac.local.86757.0 new file mode 100644 index 0000000000000000000000000000000000000000..f7faafe6c2b6faa8af858204bc769a50dbb92de2 --- /dev/null +++ b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/interact/events.out.tfevents.1684388387.JMac.local.86757.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e571710bb077a186d5841f41570cb79c0d8364b23ad6c763b1b9296ceaf0284f +size 40 diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/interact/events.out.tfevents.1684388398.JMac.local.86815.0 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/interact/events.out.tfevents.1684388398.JMac.local.86815.0 new file mode 100644 index 0000000000000000000000000000000000000000..46cd80b5f2d0156cdabca3a13ae067311fb60c02 --- /dev/null +++ b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/interact/events.out.tfevents.1684388398.JMac.local.86815.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:836310578ed6206604d3b1432fc5f35019c383105fbb64f1505a5bd72baf68cb +size 10028 diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/model/events.out.tfevents.1684388387.JMac.local.86757.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/model/events.out.tfevents.1684388387.JMac.local.86757.1 new file mode 100644 index 0000000000000000000000000000000000000000..8db3775f5995cb0d7756083bf2c042a2f313cf09 --- /dev/null +++ b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/model/events.out.tfevents.1684388387.JMac.local.86757.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:104eaae7368044a1396e1f0288356e64792ffebc2905456d3a98edd39438d03c +size 40 diff --git a/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/model/events.out.tfevents.1684388398.JMac.local.86815.1 b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/model/events.out.tfevents.1684388398.JMac.local.86815.1 new file mode 100644 index 0000000000000000000000000000000000000000..c16a4edccd9deded79b4f91247e3d96257e82955 --- /dev/null +++ b/ClassControl/CartPole-v1/Train_ray_CartPole-v1_NoisyDQN_20230518-133947/tb_logs/model/events.out.tfevents.1684388398.JMac.local.86815.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fd21541f93e709c2d2db525eb5b8fb4569896f9ec747de14ab5193752825d5f +size 375106 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/config.yaml b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/config.yaml similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/config.yaml rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/config.yaml diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/logs/log.txt b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/logs/log.txt similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/logs/log.txt rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/logs/log.txt diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1000 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1000 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1000 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1000 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/1500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2000 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2000 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2000 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2000 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/2500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3000 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3000 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3000 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3000 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/3500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4000 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4000 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4000 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4000 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/4500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5000 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5000 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5000 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5000 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/5500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6000 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6000 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6000 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6000 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/6500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7000 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7000 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7000 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7000 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7500 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7500 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7500 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/7500 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/best b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/best similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/best rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/models/best diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.0 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.0 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.0 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.0 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.0 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.0 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.0 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/interact/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.0 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.1 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.1 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.1 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339616.DESKTOP-H34HQIQ.85940.1 diff --git a/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.1 b/ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.1 similarity index 100% rename from CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.1 rename to ClassControl/CartPole-v1/Train_ray_multi_learner_CartPole-v1_DQN_20230518-000656/tb_logs/model/events.out.tfevents.1684339625.DESKTOP-H34HQIQ.86440.1 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/config.yaml b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/config.yaml similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/config.yaml rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/config.yaml diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/logs/log.txt b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/logs/log.txt similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/logs/log.txt rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/logs/log.txt diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/1500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/2500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/3500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/4500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/5500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/6000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/6000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/6000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/6000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/best b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/best similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/best rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/models/best diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/interact/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.0 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/interact/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.0 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/interact/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.0 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/interact/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.0 diff --git a/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/model/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.1 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/model/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.1 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/model/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.1 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DQN_20230515-211721/tb_logs/model/events.out.tfevents.1684156641.DESKTOP-H34HQIQ.65936.1 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/config.yaml b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/config.yaml similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/config.yaml rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/config.yaml diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/logs/log.txt b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/logs/log.txt similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/logs/log.txt rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/logs/log.txt diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/1500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/2500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/3500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/4500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/5500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/best b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/best similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/best rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/models/best diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/interact/events.out.tfevents.1684208740.JMac.local.51823.0 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/interact/events.out.tfevents.1684208740.JMac.local.51823.0 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/interact/events.out.tfevents.1684208740.JMac.local.51823.0 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/interact/events.out.tfevents.1684208740.JMac.local.51823.0 diff --git a/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/model/events.out.tfevents.1684208740.JMac.local.51823.1 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/model/events.out.tfevents.1684208740.JMac.local.51823.1 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/model/events.out.tfevents.1684208740.JMac.local.51823.1 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DoubleDQN_20230516-114540/tb_logs/model/events.out.tfevents.1684208740.JMac.local.51823.1 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/config.yaml b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/config.yaml similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/config.yaml rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/config.yaml diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/logs/log.txt b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/logs/log.txt similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/logs/log.txt rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/logs/log.txt diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/10500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/11500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/12000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/12000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/12000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/12000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/1500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/2500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/3500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/4500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/5500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/6500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/7500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/8500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9000 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9000 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9000 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9500 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9500 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/9500 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/best b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/best similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/best rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/models/best diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/interact/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.0 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/interact/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.0 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/interact/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.0 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/interact/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.0 diff --git a/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/model/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.1 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/model/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.1 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/model/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.1 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_DuelingDQN_20230517-223843/tb_logs/model/events.out.tfevents.1684334323.DESKTOP-H34HQIQ.30484.1 diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/config.yaml b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..c69bd9442fff201ebe58683768db17f54ccf0eae --- /dev/null +++ b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/config.yaml @@ -0,0 +1,47 @@ +general_cfg: + algo_name: NoisyDQN + collect_traj: false + device: cpu + env_name: gym + load_checkpoint: false + load_model_step: best + load_path: Train_CartPole-v1_DQN_20221026-054757 + max_episode: 100 + max_step: 200 + mode: train + model_save_fre: 500 + mp_backend: single + n_learners: 1 + n_workers: 2 + online_eval: true + online_eval_episode: 10 + seed: 1 + share_buffer: true +algo_cfg: + batch_size: 64 + buffer_size: 100000 + buffer_type: REPLAY_QUE + epsilon_decay: 500 + epsilon_end: 0.01 + epsilon_start: 0.95 + gamma: 0.99 + lr: 0.0001 + target_update: 4 + value_layers: + - activation: relu + layer_size: + - 256 + layer_type: noisy_linear + std_init: 0.4 + - activation: relu + layer_size: + - 256 + layer_type: noisy_linear + std_init: 0.4 +env_cfg: + id: CartPole-v1 + ignore_params: + - wrapper + - ignore_params + render_mode: null + wrapper: null diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/logs/log.txt b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/logs/log.txt new file mode 100644 index 0000000000000000000000000000000000000000..dfd7219b62f7ceb730768e2629b02e74709829df --- /dev/null +++ b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/logs/log.txt @@ -0,0 +1,164 @@ +2023-05-18 13:37:37 - SimpleLog - INFO: - General Configs: +2023-05-18 13:37:37 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:37:37 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:37:37 - SimpleLog - INFO: - env_name gym +2023-05-18 13:37:37 - SimpleLog - INFO: - algo_name NoisyDQN +2023-05-18 13:37:37 - SimpleLog - INFO: - mode train +2023-05-18 13:37:37 - SimpleLog - INFO: - device cpu +2023-05-18 13:37:37 - SimpleLog - INFO: - seed 1 +2023-05-18 13:37:37 - SimpleLog - INFO: - max_episode 100 +2023-05-18 13:37:37 - SimpleLog - INFO: - max_step 200 +2023-05-18 13:37:37 - SimpleLog - INFO: - collect_traj 0 +2023-05-18 13:37:37 - SimpleLog - INFO: - mp_backend single +2023-05-18 13:37:37 - SimpleLog - INFO: - n_workers 2 +2023-05-18 13:37:37 - SimpleLog - INFO: - n_learners 1 +2023-05-18 13:37:37 - SimpleLog - INFO: - share_buffer 1 +2023-05-18 13:37:37 - SimpleLog - INFO: - online_eval 1 +2023-05-18 13:37:37 - SimpleLog - INFO: - online_eval_episode 10 +2023-05-18 13:37:37 - SimpleLog - INFO: - model_save_fre 500 +2023-05-18 13:37:37 - SimpleLog - INFO: - load_checkpoint 0 +2023-05-18 13:37:37 - SimpleLog - INFO: - load_path Train_CartPole-v1_DQN_20221026-054757 +2023-05-18 13:37:37 - SimpleLog - INFO: - load_model_step best +2023-05-18 13:37:37 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:37:37 - SimpleLog - INFO: - Algo Configs: +2023-05-18 13:37:37 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:37:37 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:37:37 - SimpleLog - INFO: - epsilon_start 0.95 +2023-05-18 13:37:37 - SimpleLog - INFO: - epsilon_end 0.01 +2023-05-18 13:37:37 - SimpleLog - INFO: - epsilon_decay 500 +2023-05-18 13:37:37 - SimpleLog - INFO: - gamma 0.99 +2023-05-18 13:37:37 - SimpleLog - INFO: - lr 0.0001 +2023-05-18 13:37:37 - SimpleLog - INFO: - buffer_size 100000 +2023-05-18 13:37:37 - SimpleLog - INFO: - batch_size 64 +2023-05-18 13:37:37 - SimpleLog - INFO: - target_update 4 +2023-05-18 13:37:37 - SimpleLog - INFO: - value_layers [{'layer_type': 'noisy_linear', 'layer_size': [256], 'activation': 'relu', 'std_init': 0.4}, {'layer_type': 'noisy_linear', 'layer_size': [256], 'activation': 'relu', 'std_init': 0.4}] +2023-05-18 13:37:37 - SimpleLog - INFO: - buffer_type REPLAY_QUE +2023-05-18 13:37:37 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:37:37 - SimpleLog - INFO: - Env Configs: +2023-05-18 13:37:37 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:37:37 - SimpleLog - INFO: - Name Value Type +2023-05-18 13:37:37 - SimpleLog - INFO: - id CartPole-v1 +2023-05-18 13:37:37 - SimpleLog - INFO: - render_mode None +2023-05-18 13:37:37 - SimpleLog - INFO: - wrapper None +2023-05-18 13:37:37 - SimpleLog - INFO: - ignore_params ['wrapper', 'ignore_params'] +2023-05-18 13:37:37 - SimpleLog - INFO: - ================================================================================ +2023-05-18 13:37:37 - SimpleLog - INFO: - obs_space: Box([-4.8000002e+00 -3.4028235e+38 -4.1887903e-01 -3.4028235e+38], [4.8000002e+00 3.4028235e+38 4.1887903e-01 3.4028235e+38], (4,), float32), n_actions: Discrete(2) +2023-05-18 13:37:37 - SimpleLog - INFO: - Start training! +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 0, ep_reward: 12.0, ep_step: 12 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 1, ep_reward: 23.0, ep_step: 23 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 2, ep_reward: 21.0, ep_step: 21 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 3, ep_reward: 14.0, ep_step: 14 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 4, ep_reward: 24.0, ep_step: 24 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 5, ep_reward: 18.0, ep_step: 18 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 6, ep_reward: 45.0, ep_step: 45 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 7, ep_reward: 30.0, ep_step: 30 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 8, ep_reward: 25.0, ep_step: 25 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 9, ep_reward: 29.0, ep_step: 29 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 10, ep_reward: 13.0, ep_step: 13 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 11, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 12, ep_reward: 11.0, ep_step: 11 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 13, ep_reward: 14.0, ep_step: 14 +2023-05-18 13:37:37 - SimpleLog - INFO: - episode: 14, ep_reward: 12.0, ep_step: 12 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 15, ep_reward: 11.0, ep_step: 11 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 16, ep_reward: 11.0, ep_step: 11 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 17, ep_reward: 28.0, ep_step: 28 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 18, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 19, ep_reward: 13.0, ep_step: 13 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 20, ep_reward: 15.0, ep_step: 15 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 21, ep_reward: 13.0, ep_step: 13 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 22, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 23, ep_reward: 17.0, ep_step: 17 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 24, ep_reward: 21.0, ep_step: 21 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 25, ep_reward: 12.0, ep_step: 12 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 26, ep_reward: 16.0, ep_step: 16 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 27, ep_reward: 13.0, ep_step: 13 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 28, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 29, ep_reward: 12.0, ep_step: 12 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 30, ep_reward: 22.0, ep_step: 22 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 31, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 32, ep_reward: 13.0, ep_step: 13 +2023-05-18 13:37:38 - SimpleLog - INFO: - update_step: 500, online_eval_reward: 10.000 +2023-05-18 13:37:38 - SimpleLog - INFO: - current update step obtain a better online_eval_reward: 10.000, save the best model! +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 33, ep_reward: 14.0, ep_step: 14 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 34, ep_reward: 9.0, ep_step: 9 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 35, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 36, ep_reward: 11.0, ep_step: 11 +2023-05-18 13:37:38 - SimpleLog - INFO: - episode: 37, ep_reward: 9.0, ep_step: 9 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 38, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 39, ep_reward: 14.0, ep_step: 14 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 40, ep_reward: 9.0, ep_step: 9 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 41, ep_reward: 11.0, ep_step: 11 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 42, ep_reward: 9.0, ep_step: 9 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 43, ep_reward: 9.0, ep_step: 9 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 44, ep_reward: 15.0, ep_step: 15 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 45, ep_reward: 15.0, ep_step: 15 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 46, ep_reward: 9.0, ep_step: 9 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 47, ep_reward: 11.0, ep_step: 11 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 48, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 49, ep_reward: 9.0, ep_step: 9 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 50, ep_reward: 12.0, ep_step: 12 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 51, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 52, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 53, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 54, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 55, ep_reward: 10.0, ep_step: 10 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 56, ep_reward: 39.0, ep_step: 39 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 57, ep_reward: 17.0, ep_step: 17 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 58, ep_reward: 20.0, ep_step: 20 +2023-05-18 13:37:39 - SimpleLog - INFO: - episode: 59, ep_reward: 21.0, ep_step: 21 +2023-05-18 13:37:40 - SimpleLog - INFO: - episode: 60, ep_reward: 55.0, ep_step: 55 +2023-05-18 13:37:40 - SimpleLog - INFO: - episode: 61, ep_reward: 26.0, ep_step: 26 +2023-05-18 13:37:40 - SimpleLog - INFO: - episode: 62, ep_reward: 29.0, ep_step: 29 +2023-05-18 13:37:40 - SimpleLog - INFO: - episode: 63, ep_reward: 35.0, ep_step: 35 +2023-05-18 13:37:40 - SimpleLog - INFO: - update_step: 1000, online_eval_reward: 27.000 +2023-05-18 13:37:40 - SimpleLog - INFO: - current update step obtain a better online_eval_reward: 27.000, save the best model! +2023-05-18 13:37:40 - SimpleLog - INFO: - episode: 64, ep_reward: 27.0, ep_step: 27 +2023-05-18 13:37:40 - SimpleLog - INFO: - episode: 65, ep_reward: 41.0, ep_step: 41 +2023-05-18 13:37:40 - SimpleLog - INFO: - episode: 66, ep_reward: 91.0, ep_step: 91 +2023-05-18 13:37:41 - SimpleLog - INFO: - episode: 67, ep_reward: 71.0, ep_step: 71 +2023-05-18 13:37:41 - SimpleLog - INFO: - episode: 68, ep_reward: 72.0, ep_step: 72 +2023-05-18 13:37:41 - SimpleLog - INFO: - episode: 69, ep_reward: 24.0, ep_step: 24 +2023-05-18 13:37:41 - SimpleLog - INFO: - episode: 70, ep_reward: 50.0, ep_step: 50 +2023-05-18 13:37:41 - SimpleLog - INFO: - episode: 71, ep_reward: 85.0, ep_step: 85 +2023-05-18 13:37:42 - SimpleLog - INFO: - update_step: 1500, online_eval_reward: 66.000 +2023-05-18 13:37:42 - SimpleLog - INFO: - current update step obtain a better online_eval_reward: 66.000, save the best model! +2023-05-18 13:37:42 - SimpleLog - INFO: - episode: 72, ep_reward: 183.0, ep_step: 183 +2023-05-18 13:37:42 - SimpleLog - INFO: - episode: 73, ep_reward: 124.0, ep_step: 124 +2023-05-18 13:37:43 - SimpleLog - INFO: - episode: 74, ep_reward: 123.0, ep_step: 123 +2023-05-18 13:37:43 - SimpleLog - INFO: - update_step: 2000, online_eval_reward: 102.000 +2023-05-18 13:37:43 - SimpleLog - INFO: - current update step obtain a better online_eval_reward: 102.000, save the best model! +2023-05-18 13:37:43 - SimpleLog - INFO: - episode: 75, ep_reward: 192.0, ep_step: 192 +2023-05-18 13:37:44 - SimpleLog - INFO: - episode: 76, ep_reward: 115.0, ep_step: 115 +2023-05-18 13:37:44 - SimpleLog - INFO: - episode: 77, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:45 - SimpleLog - INFO: - update_step: 2500, online_eval_reward: 99.000 +2023-05-18 13:37:45 - SimpleLog - INFO: - episode: 78, ep_reward: 171.0, ep_step: 171 +2023-05-18 13:37:45 - SimpleLog - INFO: - episode: 79, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:46 - SimpleLog - INFO: - episode: 80, ep_reward: 125.0, ep_step: 125 +2023-05-18 13:37:46 - SimpleLog - INFO: - update_step: 3000, online_eval_reward: 90.000 +2023-05-18 13:37:46 - SimpleLog - INFO: - episode: 81, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:47 - SimpleLog - INFO: - episode: 82, ep_reward: 140.0, ep_step: 140 +2023-05-18 13:37:47 - SimpleLog - INFO: - episode: 83, ep_reward: 172.0, ep_step: 172 +2023-05-18 13:37:48 - SimpleLog - INFO: - episode: 84, ep_reward: 78.0, ep_step: 78 +2023-05-18 13:37:48 - SimpleLog - INFO: - update_step: 3500, online_eval_reward: 82.000 +2023-05-18 13:37:48 - SimpleLog - INFO: - episode: 85, ep_reward: 92.0, ep_step: 92 +2023-05-18 13:37:48 - SimpleLog - INFO: - episode: 86, ep_reward: 104.0, ep_step: 104 +2023-05-18 13:37:49 - SimpleLog - INFO: - episode: 87, ep_reward: 99.0, ep_step: 99 +2023-05-18 13:37:49 - SimpleLog - INFO: - episode: 88, ep_reward: 81.0, ep_step: 81 +2023-05-18 13:37:49 - SimpleLog - INFO: - episode: 89, ep_reward: 97.0, ep_step: 97 +2023-05-18 13:37:49 - SimpleLog - INFO: - update_step: 4000, online_eval_reward: 106.000 +2023-05-18 13:37:49 - SimpleLog - INFO: - current update step obtain a better online_eval_reward: 106.000, save the best model! +2023-05-18 13:37:49 - SimpleLog - INFO: - episode: 90, ep_reward: 99.0, ep_step: 99 +2023-05-18 13:37:50 - SimpleLog - INFO: - episode: 91, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:50 - SimpleLog - INFO: - episode: 92, ep_reward: 93.0, ep_step: 93 +2023-05-18 13:37:51 - SimpleLog - INFO: - episode: 93, ep_reward: 127.0, ep_step: 127 +2023-05-18 13:37:51 - SimpleLog - INFO: - update_step: 4500, online_eval_reward: 200.000 +2023-05-18 13:37:51 - SimpleLog - INFO: - current update step obtain a better online_eval_reward: 200.000, save the best model! +2023-05-18 13:37:51 - SimpleLog - INFO: - episode: 94, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:52 - SimpleLog - INFO: - episode: 95, ep_reward: 145.0, ep_step: 145 +2023-05-18 13:37:53 - SimpleLog - INFO: - update_step: 5000, online_eval_reward: 200.000 +2023-05-18 13:37:53 - SimpleLog - INFO: - episode: 96, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:53 - SimpleLog - INFO: - episode: 97, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:54 - SimpleLog - INFO: - episode: 98, ep_reward: 168.0, ep_step: 168 +2023-05-18 13:37:54 - SimpleLog - INFO: - update_step: 5500, online_eval_reward: 200.000 +2023-05-18 13:37:55 - SimpleLog - INFO: - episode: 99, ep_reward: 200.0, ep_step: 200 +2023-05-18 13:37:55 - SimpleLog - INFO: - Finish training! total time consumed: 17.76s diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/1000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/1000 new file mode 100644 index 0000000000000000000000000000000000000000..a00854259473db0232c28f5034fdb693693f2c98 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/1000 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/1500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/1500 new file mode 100644 index 0000000000000000000000000000000000000000..e47105cd78b3aae8108c4489e5a6ffa42c62cff6 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/1500 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/2000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/2000 new file mode 100644 index 0000000000000000000000000000000000000000..8117923d0ce025d142f1c92f2618017e77afefc6 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/2000 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/2500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/2500 new file mode 100644 index 0000000000000000000000000000000000000000..cfd02b8c034e52278b98eedcff3d8a163742e9d2 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/2500 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/3000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/3000 new file mode 100644 index 0000000000000000000000000000000000000000..bb96a281b667bd68b14379bfb53d67815e6cbc82 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/3000 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/3500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/3500 new file mode 100644 index 0000000000000000000000000000000000000000..dac226b686bab871a2d3cd74ac2b117339b87470 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/3500 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/4000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/4000 new file mode 100644 index 0000000000000000000000000000000000000000..5d56258c54214abe346018c54630fae29bccfd97 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/4000 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/4500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/4500 new file mode 100644 index 0000000000000000000000000000000000000000..256385d9a14af6907e8d4f9357a38474bc084476 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/4500 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/500 new file mode 100644 index 0000000000000000000000000000000000000000..e0229aa8dd73defe3331a33c26d2f6f118c5139b Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/500 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/5000 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/5000 new file mode 100644 index 0000000000000000000000000000000000000000..9e92d6344ad25415bfd91e4d2999aba9697742e7 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/5000 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/5500 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/5500 new file mode 100644 index 0000000000000000000000000000000000000000..f7467f4ae4a76e74964283bd11a432ade2eb067c Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/5500 differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/best b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/best new file mode 100644 index 0000000000000000000000000000000000000000..256385d9a14af6907e8d4f9357a38474bc084476 Binary files /dev/null and b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/models/best differ diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/tb_logs/interact/events.out.tfevents.1684388257.JMac.local.86406.0 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/tb_logs/interact/events.out.tfevents.1684388257.JMac.local.86406.0 new file mode 100644 index 0000000000000000000000000000000000000000..cf124daffd873d7c796bd43c0f2719882536ab1e --- /dev/null +++ b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/tb_logs/interact/events.out.tfevents.1684388257.JMac.local.86406.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a11e5bd8547e9f08ec39d9101d864b0c14b56d98b9f5599088f630547c6ef2a9 +size 10436 diff --git a/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/tb_logs/model/events.out.tfevents.1684388257.JMac.local.86406.1 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/tb_logs/model/events.out.tfevents.1684388257.JMac.local.86406.1 new file mode 100644 index 0000000000000000000000000000000000000000..172c6199d6af643d1ca5829e7eda51e10d2a66c2 --- /dev/null +++ b/ClassControl/CartPole-v1/Train_single_CartPole-v1_NoisyDQN_20230518-133737/tb_logs/model/events.out.tfevents.1684388257.JMac.local.86406.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e0d109f0247d75bc2227d6d1e7141259fe5312d79d5a5002b4705cddd707059 +size 272941 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/config.yaml b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/config.yaml similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/config.yaml rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/config.yaml diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/logs/log.txt b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/logs/log.txt similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/logs/log.txt rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/logs/log.txt diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/10 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/10 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/10 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/10 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/20 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/20 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/20 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/20 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/30 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/30 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/30 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/30 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/40 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/40 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/40 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/40 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/50 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/50 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/50 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/50 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/60 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/60 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/60 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/60 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/70 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/70 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/70 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/70 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/80 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/80 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/80 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/80 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/best b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/best similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/best rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/models/best diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/interact/events.out.tfevents.1684302280.JMac.local.60840.0 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/interact/events.out.tfevents.1684302280.JMac.local.60840.0 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/interact/events.out.tfevents.1684302280.JMac.local.60840.0 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/interact/events.out.tfevents.1684302280.JMac.local.60840.0 diff --git a/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/model/events.out.tfevents.1684302280.JMac.local.60840.1 b/ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/model/events.out.tfevents.1684302280.JMac.local.60840.1 similarity index 100% rename from CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/model/events.out.tfevents.1684302280.JMac.local.60840.1 rename to ClassControl/CartPole-v1/Train_single_CartPole-v1_PPO_20230517-134440/tb_logs/model/events.out.tfevents.1684302280.JMac.local.60840.1