We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 2c407db, commit c27ed37. Copy full SHA for c27ed37
Reinforcement_learning_TUT/experiments/Solve_BipedalWalker/A3C.py
@@ -25,11 +25,11 @@
25
N_WORKERS = multiprocessing.cpu_count()
26
MAX_GLOBAL_EP = 8000
27
GLOBAL_NET_SCOPE = 'Global_Net'
28
-UPDATE_GLOBAL_ITER = 5
29
-GAMMA = 0.99
+UPDATE_GLOBAL_ITER = 10
+GAMMA = 0.999
30
ENTROPY_BETA = 0.005
31
-LR_A = 0.0001 # learning rate for actor
32
-LR_C = 0.001 # learning rate for critic
+LR_A = 0.00002 # learning rate for actor
+LR_C = 0.0001 # learning rate for critic
33
GLOBAL_RUNNING_R = []
34
GLOBAL_EP = 0
35
0 commit comments