-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathParameters.py
89 lines (71 loc) · 1.57 KB
/
Parameters.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
#### Pendulum Parameters
# NOTE: this whole preset is inert. It is wrapped in a single triple-quoted
# string literal, so none of the assignments inside it are executed and none
# of these names are defined by this section. The text between the quotes is
# string content, not comments, and is kept verbatim.
""" # General parameters
BATCH_SIZE = 64
EPOCHS = 200
FITTING_ITERATIONS = 3
GAMMA = 0.9
BUFFER_SIZE = 100000
WASHOUT = 5000
LEARN_ONLINE = True
BATCH_ITERATIONS = 300
# Frame skipping
SKIP_FRAMES = False
FRAME_SKIP = 20
# Normalize actions
NORMALIZE_ACTIONS = True
# Early stopping
EARLY_STOPPING = False
WINDOW_SIZE = 3
# resicual connections for agent
USE_RESIDUALS = False
# imitation learning parameters:
USE_IMITATION_LEARNING = False
IMITATION_BATCH_SIZE = 32
IMITATION_BUFFER_SIZE = 10000
IMITATION_LAMBDA = 1 / IMITATION_BATCH_SIZE
# parameter noise
PARAMETER_NOISE = False
INITIAL_NOISE_STD = 0.3
DESIRED_ACTION_STD = 0.1
ADAPT_COEFFICIENT = 1.05
# DDPG parameters
TAU = 0.001
ACTOR_LEARNING_RATE = 1e-4
CRITIC_LEARNING_RATE = 1e-3
"""
#ACTOR_LEARNING_RATE = 0
#CRITIC_LEARNING_RATE = 0
#### Hockey Parameters
# Active configuration: every name below is a plain module-level constant.

# -- General settings --
EPOCHS = 10 ** 4
BATCH_SIZE = 256
BATCH_ITERATIONS = 300
FITTING_ITERATIONS = 3
GAMMA = 0.85
BUFFER_SIZE = 10 ** 6
WASHOUT = 5 * 10 ** 4
LEARN_ONLINE = True

# -- Frame skipping --
SKIP_FRAMES = True
FRAME_SKIP = 5

# -- Action normalization --
NORMALIZE_ACTIONS = True

# -- Early stopping (flag is currently False) --
WINDOW_SIZE = 3
EARLY_STOPPING = False

# -- Residual connections for the agent (flag is currently False) --
USE_RESIDUALS = False

# -- Imitation learning --
USE_IMITATION_LEARNING = True
IMITATION_BUFFER_SIZE = 10 ** 4
IMITATION_BATCH_SIZE = 128
# Defined as the reciprocal of the imitation batch size, so it tracks any
# change made to IMITATION_BATCH_SIZE on the line above.
IMITATION_LAMBDA = 1 / IMITATION_BATCH_SIZE

# -- Parameter noise --
PARAMETER_NOISE = True
ADAPT_COEFFICIENT = 1.05
DESIRED_ACTION_STD = 0.1
INITIAL_NOISE_STD = 1

# -- DDPG --
CRITIC_LEARNING_RATE = 0.001
ACTOR_LEARNING_RATE = 0.0001
TAU = 1e-3