-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.py
42 lines (34 loc) · 1.52 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
from omegaconf import DictConfig
from builders import build_logdir, build_env, build_callback, build_model
from stable_baselines3.common.base_class import BaseAlgorithm
import hydra
class Trainer:
    """
    Owns the pieces of a single training run (log dir, environments, callback, model)
    and drives the training loop.
    """

    def __init__(self, cfg: DictConfig):
        """
        Initialize the trainer class, including setting up log dir, environment, callbacks and model
        :param cfg: Hydra config containing all the information about the experiment
        """
        self.cfg = cfg
        self._setup()

    def _setup(self):
        """
        Build the log dir, environments, callback and model from ``self.cfg`` using the ``builders`` helpers
        """
        # Order matters: the log dir feeds every later builder, and the callback
        # and the model both need environments that already exist.
        self.log_dir = build_logdir(self.cfg)
        self.train_env, self.eval_env, self.video_env = build_env(
            self.cfg.env_name, self.log_dir, self.cfg.seed
        )
        self.cb = build_callback(
            self.cfg.env_name, self.log_dir, self.eval_env, self.cfg.eval, self.video_env
        )
        self.model = build_model(
            self.cfg.env_name, self.train_env, self.cfg.model, self.log_dir, self.cfg.seed
        )

    def train(self) -> BaseAlgorithm:
        """
        Training the model using stable-baselines3 function model.learn
        The three environments are closed when training ends, whether it finished or raised.
        :return: The trained model
        """
        try:
            self.model.learn(
                total_timesteps=self.cfg.train.time_steps,
                log_interval=5,
                callback=self.cb,
            )
        finally:
            # Close the environments even if learn() fails or is interrupted,
            # so a crashed run does not leave them open.
            self._close_envs()
        return self.model

    def _close_envs(self) -> None:
        """
        Close the train, eval and video environments, in that order
        """
        for env in (self.train_env, self.eval_env, self.video_env):
            env.close()
@hydra.main(version_base=None, config_path="hydra_config", config_name="default")
def main(cfg: DictConfig):
    """
    Script entry point: announce the run, then build a Trainer from the config and train it
    :param cfg: Hydra config for the experiment (reads ``model.name`` and ``env_name`` for the banner)
    """
    banner = f"Training model {cfg.model.name} in {cfg.env_name} env"
    print(banner)
    # The trained model returned by train() is not used here.
    Trainer(cfg).train()
# Run training only when this file is executed as a script, not when it is imported.
# main() is called without arguments; its cfg parameter is expected to be supplied
# by the @hydra.main decorator applied to it.
if __name__ == "__main__":
    main()