From 53aff40e93592130c4b71a54a9c543a7e2bdc0a6 Mon Sep 17 00:00:00 2001 From: cun Date: Wed, 1 Sep 2021 10:28:45 +0900 Subject: [PATCH 1/4] register new envs --- .gitignore | 1 + asset/__init__.py | 16 ++++++++++++++++ {gym => asset}/continuous_mountain_car.py | 0 {gym => asset}/pendulum.py | 0 {gym => asset}/rendering.py | 0 ...ountainCarContinuous-h-v1_level_0_actor.pth} | Bin ...ountainCarContinuous-h-v1_level_0_crtic.pth} | Bin ...ountainCarContinuous-h-v1_level_1_actor.pth} | Bin ...ountainCarContinuous-h-v1_level_1_crtic.pth} | Bin ...CarContinuous-h-v1_solved_level_0_actor.pth} | Bin ...CarContinuous-h-v1_solved_level_0_crtic.pth} | Bin ...CarContinuous-h-v1_solved_level_1_actor.pth} | Bin ...CarContinuous-h-v1_solved_level_1_crtic.pth} | Bin ...C_MountainCarContinuous-v0_level_0_actor.pth | Bin ...C_MountainCarContinuous-v0_level_0_crtic.pth | Bin ...C_MountainCarContinuous-v0_level_1_actor.pth | Bin ...C_MountainCarContinuous-v0_level_1_crtic.pth | Bin ...C_MountainCarContinuous-v0_level_2_actor.pth | Bin ...C_MountainCarContinuous-v0_level_2_crtic.pth | Bin ...ainCarContinuous-v0_solved_level_0_actor.pth | Bin ...ainCarContinuous-v0_solved_level_0_crtic.pth | Bin ...ainCarContinuous-v0_solved_level_1_actor.pth | Bin ...ainCarContinuous-v0_solved_level_1_crtic.pth | Bin ...ainCarContinuous-v0_solved_level_2_actor.pth | Bin ...ainCarContinuous-v0_solved_level_2_crtic.pth | Bin .../2level/HAC_Pendulum-h-v1_level_0_actor.pth} | Bin .../2level/HAC_Pendulum-h-v1_level_0_crtic.pth} | Bin .../2level/HAC_Pendulum-h-v1_level_1_actor.pth} | Bin .../2level/HAC_Pendulum-h-v1_level_1_crtic.pth} | Bin .../HAC_Pendulum-h-v1_solved_level_0_actor.pth} | Bin .../HAC_Pendulum-h-v1_solved_level_0_crtic.pth} | Bin .../HAC_Pendulum-h-v1_solved_level_1_actor.pth} | Bin .../HAC_Pendulum-h-v1_solved_level_1_crtic.pth} | Bin requirements.txt | 3 +++ test.py | 5 +++-- 35 files changed, 23 insertions(+), 2 deletions(-) create mode 100644 .gitignore create mode 100644 asset/__init__.py rename {gym => asset}/continuous_mountain_car.py (100%) rename {gym => asset}/pendulum.py (100%) rename {gym => asset}/rendering.py (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_0_actor.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_0_actor.pth} (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_0_crtic.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_0_crtic.pth} (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_1_actor.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_1_actor.pth} (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_1_crtic.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_1_crtic.pth} (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_0_actor.pth} (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_0_crtic.pth} (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_1_actor.pth} (100%) rename preTrained/{MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth => MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_1_crtic.pth} (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_level_0_actor.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_level_0_crtic.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_level_1_actor.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_level_1_crtic.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_level_2_actor.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_level_2_crtic.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_solved_level_2_actor.pth (100%) rename preTrained/{MountainCarContinuous-v0 => MountainCarContinuous-h-v1}/3level/HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_level_0_actor.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_0_actor.pth} (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_level_0_crtic.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_0_crtic.pth} (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_level_1_actor.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_1_actor.pth} (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_level_1_crtic.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_1_crtic.pth} (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_0_actor.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_0_actor.pth} (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_0_crtic.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_0_crtic.pth} (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_1_actor.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_1_actor.pth} (100%) rename preTrained/{Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_1_crtic.pth => Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_1_crtic.pth} (100%) create mode 100644 requirements.txt diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..7e99e36 --- /dev/null +++ b/.gitignore @@ -0,0 +1 @@ +*.pyc \ No newline at end of file diff --git a/asset/__init__.py b/asset/__init__.py new file mode 100644 index 0000000..cf8e9bd --- /dev/null +++ b/asset/__init__.py @@ -0,0 +1,16 @@ +from asset.continuous_mountain_car import Continuous_MountainCarEnv +from asset.pendulum import PendulumEnv + +from gym.envs.registration import register + +register( + id="MountainCarContinuous-h-v1", + entry_point="asset:Continuous_MountainCarEnv", + max_episode_steps=50, +) + +register( + id="Pendulum-h-v1", + entry_point="asset:PendulumEnv", + max_episode_steps=50, +) diff --git a/gym/continuous_mountain_car.py b/asset/continuous_mountain_car.py similarity index 100% rename from gym/continuous_mountain_car.py rename to asset/continuous_mountain_car.py diff --git a/gym/pendulum.py b/asset/pendulum.py similarity index 100% rename from gym/pendulum.py rename to asset/pendulum.py diff --git a/gym/rendering.py b/asset/rendering.py similarity index 100% rename from gym/rendering.py rename to asset/rendering.py diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_0_actor.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_0_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_0_actor.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_0_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_0_crtic.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_0_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_0_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_0_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_1_actor.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_1_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_1_actor.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_1_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_1_crtic.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_1_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_level_1_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_level_1_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_0_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_0_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_0_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_0_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_1_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_1_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth b/preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_1_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/2level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/2level/HAC_MountainCarContinuous-h-v1_solved_level_1_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_0_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_0_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_0_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_0_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_1_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_1_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_1_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_1_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_2_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_2_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_2_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_level_2_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_2_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_2_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_actor.pth diff --git a/preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-v0/3level/HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_0_actor.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_0_actor.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_0_actor.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_0_actor.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_0_crtic.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_0_crtic.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_0_crtic.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_0_crtic.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_1_actor.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_1_actor.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_1_actor.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_1_actor.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_1_crtic.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_1_crtic.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_level_1_crtic.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_level_1_crtic.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_0_actor.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_0_actor.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_0_actor.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_0_actor.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_0_crtic.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_0_crtic.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_0_crtic.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_0_crtic.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_1_actor.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_1_actor.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_1_actor.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_1_actor.pth diff --git a/preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_1_crtic.pth b/preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_1_crtic.pth similarity index 100% rename from preTrained/Pendulum-v0/2level/HAC_Pendulum-v0_solved_level_1_crtic.pth rename to preTrained/Pendulum-h-v1/2level/HAC_Pendulum-h-v1_solved_level_1_crtic.pth diff --git a/requirements.txt b/requirements.txt new file mode 100644 index 0000000..7b79425 --- /dev/null +++ b/requirements.txt @@ -0,0 +1,3 @@ +gym +torch +pyglet \ No newline at end of file diff --git a/test.py b/test.py index c2fdfde..0e4c2a2 100644 --- a/test.py +++ b/test.py @@ -1,5 +1,6 @@ import torch import gym +import asset import numpy as np from HAC import HAC @@ -8,11 +9,11 @@ def test(): #################### Hyperparameters #################### - env_name = "MountainCarContinuous-v0" + env_name = "MountainCarContinuous-h-v1"#"MountainCarContinuous-v0" save_episode = 10 # keep saving every n episodes max_episodes = 5 # max num of training episodes random_seed = 0 - render = False + render = True env = gym.make(env_name) state_dim = env.observation_space.shape[0] From d9267d06b49d0cbd1402eaea8ca5a97dfd658c2a Mon Sep 17 00:00:00 2001 From: cun Date: Sat, 4 Sep 2021 02:28:12 +0900 Subject: [PATCH 2/4] update after feedback --- asset/__init__.py | 2 -- asset/continuous_mountain_car.py | 2 +- asset/pendulum.py | 2 +- ...AC_MountainCarContinuous-h-v1_level_0_actor.pth} | Bin ...AC_MountainCarContinuous-h-v1_level_0_crtic.pth} | Bin ...AC_MountainCarContinuous-h-v1_level_1_actor.pth} | Bin ...AC_MountainCarContinuous-h-v1_level_1_crtic.pth} | Bin ...AC_MountainCarContinuous-h-v1_level_2_actor.pth} | Bin ...AC_MountainCarContinuous-h-v1_level_2_crtic.pth} | Bin ...tainCarContinuous-h-v1_solved_level_0_actor.pth} | Bin ...tainCarContinuous-h-v1_solved_level_0_crtic.pth} | Bin ...tainCarContinuous-h-v1_solved_level_1_actor.pth} | Bin ...tainCarContinuous-h-v1_solved_level_1_crtic.pth} | Bin ...tainCarContinuous-h-v1_solved_level_2_actor.pth} | Bin ...tainCarContinuous-h-v1_solved_level_2_crtic.pth} | Bin test.py | 2 +- train.py | 3 ++- 17 files changed, 5 insertions(+), 6 deletions(-) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_level_0_actor.pth => HAC_MountainCarContinuous-h-v1_level_0_actor.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_level_0_crtic.pth => HAC_MountainCarContinuous-h-v1_level_0_crtic.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_level_1_actor.pth => HAC_MountainCarContinuous-h-v1_level_1_actor.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_level_1_crtic.pth => HAC_MountainCarContinuous-h-v1_level_1_crtic.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_level_2_actor.pth => HAC_MountainCarContinuous-h-v1_level_2_actor.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_level_2_crtic.pth => HAC_MountainCarContinuous-h-v1_level_2_crtic.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_solved_level_0_actor.pth => HAC_MountainCarContinuous-h-v1_solved_level_0_actor.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth => HAC_MountainCarContinuous-h-v1_solved_level_0_crtic.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_solved_level_1_actor.pth => HAC_MountainCarContinuous-h-v1_solved_level_1_actor.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth => HAC_MountainCarContinuous-h-v1_solved_level_1_crtic.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_solved_level_2_actor.pth => HAC_MountainCarContinuous-h-v1_solved_level_2_actor.pth} (100%) rename preTrained/MountainCarContinuous-h-v1/3level/{HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth => HAC_MountainCarContinuous-h-v1_solved_level_2_crtic.pth} (100%) diff --git a/asset/__init__.py b/asset/__init__.py index cf8e9bd..c0d74be 100644 --- a/asset/__init__.py +++ b/asset/__init__.py @@ -6,11 +6,9 @@ register( id="MountainCarContinuous-h-v1", entry_point="asset:Continuous_MountainCarEnv", - max_episode_steps=50, ) register( id="Pendulum-h-v1", entry_point="asset:PendulumEnv", - max_episode_steps=50, ) diff --git a/asset/continuous_mountain_car.py b/asset/continuous_mountain_car.py index 90b2972..98bebdc 100644 --- a/asset/continuous_mountain_car.py +++ b/asset/continuous_mountain_car.py @@ -98,7 +98,7 @@ def render(self, mode='human'): carheight=20 if self.viewer is None: - from gym.envs.classic_control import rendering + from asset import rendering self.viewer = rendering.Viewer(screen_width, screen_height) xs = np.linspace(self.min_position, self.max_position, 100) ys = self._height(xs) diff --git a/asset/pendulum.py b/asset/pendulum.py index decdfcf..dc17dff 100644 --- a/asset/pendulum.py +++ b/asset/pendulum.py @@ -62,7 +62,7 @@ def _get_obs(self): def render(self, mode='human'): if self.viewer is None: - from gym.envs.classic_control import rendering + from asset import rendering self.viewer = rendering.Viewer(500,500) self.viewer.set_bounds(-2.2,2.2,-2.2,2.2) rod = rendering.make_capsule(1, .2) diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_0_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_0_actor.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_0_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_0_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_0_crtic.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_1_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_1_actor.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_1_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_1_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_1_crtic.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_2_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_2_actor.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_2_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_level_2_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_level_2_crtic.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_0_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_0_actor.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_0_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_0_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_0_crtic.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_1_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_1_actor.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_1_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_1_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_1_crtic.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_actor.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_2_actor.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_actor.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_2_actor.pth diff --git a/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth b/preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_2_crtic.pth similarity index 100% rename from preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-v0_solved_level_2_crtic.pth rename to preTrained/MountainCarContinuous-h-v1/3level/HAC_MountainCarContinuous-h-v1_solved_level_2_crtic.pth diff --git a/test.py b/test.py index 0e4c2a2..6c91091 100644 --- a/test.py +++ b/test.py @@ -13,7 +13,7 @@ def test(): save_episode = 10 # keep saving every n episodes max_episodes = 5 # max num of training episodes random_seed = 0 - render = True + render = False env = gym.make(env_name) state_dim = env.observation_space.shape[0] diff --git a/train.py b/train.py index c5abb51..e7e0bd1 100644 --- a/train.py +++ b/train.py @@ -1,5 +1,6 @@ import torch import gym +import asset import numpy as np from HAC import HAC @@ -7,7 +8,7 @@ def train(): #################### Hyperparameters #################### - env_name = "MountainCarContinuous-v0" + env_name = "MountainCarContinuous-h-v1" save_episode = 10 # keep saving every n episodes max_episodes = 1000 # max num of training episodes random_seed = 0 From c55d2b246491345f6b88a60f57c61fa455c5effd Mon Sep 17 00:00:00 2001 From: cun Date: Sat, 4 Sep 2021 14:05:31 +0900 Subject: [PATCH 3/4] importing path fixed --- asset/continuous_mountain_car.py | 4 ++-- asset/pendulum.py | 4 ++-- 2 files changed, 4 insertions(+), 4 deletions(-) diff --git a/asset/continuous_mountain_car.py b/asset/continuous_mountain_car.py index 98bebdc..3c8c0fb 100644 --- a/asset/continuous_mountain_car.py +++ b/asset/continuous_mountain_car.py @@ -152,7 +152,7 @@ def render_goal(self, goal, end_goal, mode='human'): carheight=20 if self.viewer is None: - from gym.envs.classic_control import rendering + from asset import rendering self.viewer = rendering.Viewer(screen_width, screen_height) xs = np.linspace(self.min_position, self.max_position, 100) ys = self._height(xs) @@ -235,7 +235,7 @@ def render_goal_2(self, goal1, goal2, end_goal, mode='human'): if self.viewer is None: - from gym.envs.classic_control import rendering + from asset import rendering self.viewer = rendering.Viewer(screen_width, screen_height) xs = np.linspace(self.min_position, self.max_position, 100) ys = self._height(xs) diff --git a/asset/pendulum.py b/asset/pendulum.py index dc17dff..6880e4f 100644 --- a/asset/pendulum.py +++ b/asset/pendulum.py @@ -89,7 +89,7 @@ def render(self, mode='human'): def render_goal(self, goal, end_goal, mode='human'): if self.viewer is None: - from gym.envs.classic_control import rendering + from asset import rendering self.viewer = rendering.Viewer(500,500) self.viewer.set_bounds(-2.2,2.2,-2.2,2.2) @@ -138,7 +138,7 @@ def render_goal(self, goal, end_goal, mode='human'): def render_goal_2(self, goal1, goal2, end_goal, mode='human'): if self.viewer is None: - from gym.envs.classic_control import rendering + from asset import rendering self.viewer = rendering.Viewer(500,500) self.viewer.set_bounds(-2.2,2.2,-2.2,2.2) From 5ffc1c23a59decbaa49c378d1ed631baed504af1 Mon Sep 17 00:00:00 2001 From: cun Date: Sat, 4 Sep 2021 14:07:32 +0900 Subject: [PATCH 4/4] update requirements --- requirements.txt | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/requirements.txt b/requirements.txt index 7b79425..8f8e260 100644 --- a/requirements.txt +++ b/requirements.txt @@ -1,3 +1,4 @@ gym torch -pyglet \ No newline at end of file +pyglet +six \ No newline at end of file