Commit 70cbcff3 authored by holgadoa

new parameters

parent 29fcf1f9
......@@ -40,16 +40,27 @@ class AgentA2C(ptanMod.agent.BaseAgent):
return np.array(actions), agent_states
ENV_ID = "HalfCheetahBulletEnv-v0"
GAMMA = 0.99
# GAMMA = 0.99
# GAE_LAMBDA = 0.95
#
# TRAJECTORY_SIZE = 2049
# LEARNING_RATE_CRITIC = 1e-3
#
# TRPO_MAX_KL = 0.01
# TRPO_DAMPING = 0.1
#
# TEST_ITERS = 100000
GAMMA = 0.98
GAE_LAMBDA = 0.95
TRAJECTORY_SIZE = 2049
TRAJECTORY_SIZE = 8192
LEARNING_RATE_CRITIC = 1e-3
TRPO_MAX_KL = 0.01
TRPO_DAMPING = 0.1
TRPO_MAX_KL = 0.001
TRPO_DAMPING = 0.001
TEST_ITERS = 100000
TEST_ITERS = 1000
def calc_adv_ref(trajectory, net_crt, states_v, device="cpu"):
"""
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment