Commit a2d218fa authored by Eduard Pizur
Browse files

Merge branch 'master' of git.kpi.fei.tuke.sk:ep858fo/dp-2020 into master

parents fba65de5 f5cc4cfd
......@@ -99,7 +99,7 @@ class Agent():
max_next_actions = T.argmax(q_vals_next_net, dim=1)
q_vals_next_target_net = self.target_network.forward(next_states)
-q_vals_next_target_net = q_vals_net.gather(1, max_next_actions.unsqueeze(-1)).squeeze(-1)
+q_vals_next_target_net = q_vals_next_target_net.gather(1, max_next_actions.unsqueeze(-1)).squeeze(-1)
q_vals_next_target_net[dones] = 0.0
q_vals_next_target_net = q_vals_next_target_net.detach()
......
......@@ -7,7 +7,7 @@ DISCOUNT_FACTOR = 0.99
EPSILON_START = 1
EPSILON_DECREMENT = 0.00001
EPSILON_MINIMUM = 0.05
-NUM_OF_EPISODES = 600
+NUM_OF_EPISODES = 6000
TARGET_NET_UPDATE = 1_000
BATCH_SIZE = 32
REPLAY_MEMORY_SIZE = 10_000
......
Supports Markdown
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment