You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
Copy file name to clipboard. Expand all lines: params.py
+9 -9 Lines changed: 9 additions & 9 deletions
Original file line number
Diff line number
Diff line change
@@ -42,16 +42,16 @@ class train_params:
42
42
DENSE2_SIZE=300# Size of second hidden layer in networks
43
43
FINAL_LAYER_INIT=0.003# Initialise networks' final layer weights in range +/-final_layer_init
44
44
NUM_ATOMS=51# Number of atoms in output layer of distributional critic
45
-
V_MIN=-20.0# Lower bound of critic value output distribution
46
-
V_MAX=0.0# Upper bound of critic value output distribution (V_min and V_max should be chosen based on the range of normalised reward values in the chosen env)
45
+
V_MIN=-10.0# Lower bound of critic value output distribution
46
+
V_MAX=10.0# Upper bound of critic value output distribution (V_min and V_max should be chosen based on the range of normalised reward values in the chosen env)
47
47
TAU=0.001# Parameter for soft target network updates
48
48
USE_BATCH_NORM=False# Whether or not to use batch normalisation in the networks
49
49
50
50
# Files/Directories
51
-
SAVE_CKPT_STEP=10000# Save checkpoint every save_ckpt_step training steps
52
-
CKPT_DIR='./ckpts'# Directory for saving/loading checkpoints
53
-
CKPT_FILE=None# Checkpoint file to load and resume training from (if None, train from scratch)
54
-
LOG_DIR='./logs/train'# Directory for saving Tensorboard logs (if None, do not save logs)
51
+
SAVE_CKPT_STEP=10000# Save checkpoint every save_ckpt_step training steps
52
+
CKPT_DIR='./ckpts/'+ENV# Directory for saving/loading checkpoints
53
+
CKPT_FILE=None# Checkpoint file to load and resume training from (if None, train from scratch)
54
+
LOG_DIR='./logs/train/'+ENV# Directory for saving Tensorboard logs (if None, do not save logs)
55
55
56
56
57
57
class test_params:
@@ -66,10 +66,10 @@ class test_params:
66
66
MAX_EP_LENGTH=1000# Maximum number of steps per episode
67
67
68
68
# Files/directories
69
-
CKPT_DIR='./ckpts'# Directory for saving/loading checkpoints
69
+
CKPT_DIR='./ckpts/'+ENV# Directory for saving/loading checkpoints
70
70
CKPT_FILE=None# Checkpoint file to load and test (if None, load latest ckpt)
71
71
RESULTS_DIR='./test_results'# Directory for saving txt file of results (if None, do not save results)
72
-
LOG_DIR='./logs/test'# Directory for saving Tensorboard logs (if None, do not save logs)
72
+
LOG_DIR='./logs/test/'+ENV# Directory for saving Tensorboard logs (if None, do not save logs)
73
73
74
74
75
75
class play_params:
@@ -83,7 +83,7 @@ class play_params:
83
83
MAX_EP_LENGTH=1000# Maximum number of steps per episode
84
84
85
85
# Files/directories
86
-
CKPT_DIR='./ckpts'# Directory for saving/loading checkpoints
86
+
CKPT_DIR='./ckpts/'+ENV# Directory for saving/loading checkpoints
87
87
CKPT_FILE=None# Checkpoint file to load and run (if None, load latest ckpt)
88
88
RECORD_DIR='./video'# Directory to store recorded gif of gameplay (if None, do not record)
# This allows testing to be run alongside training by running 'run_every_new_ckpt.sh', which monitors the ckpt directory and runs test.py every time a new ckpt is added.
0 commit comments