minor fix: also include obs_type 44 when selecting bidding episode returns in learn()
This commit is contained in:
parent
4a55570be6
commit
ee409846f3
|
@ -40,7 +40,7 @@ def learn(position, actor_models, model, batch, optimizer, flags, lock):
|
||||||
if position != "bidding":
|
if position != "bidding":
|
||||||
episode_returns = batch['episode_return'][batch['done'] & (batch["obs_type"] == position_index[position])]
|
episode_returns = batch['episode_return'][batch['done'] & (batch["obs_type"] == position_index[position])]
|
||||||
else:
|
else:
|
||||||
episode_returns = batch['episode_return'][batch['done'] & ((batch["obs_type"] == 41) | (batch["obs_type"] == 42) | (batch["obs_type"] == 43))]
|
episode_returns = batch['episode_return'][batch['done'] & ((batch["obs_type"] == 41) | (batch["obs_type"] == 42) | (batch["obs_type"] == 43) | (batch["obs_type"] == 44))]
|
||||||
if len(episode_returns) > 0:
|
if len(episode_returns) > 0:
|
||||||
mean_episode_return_buf[position].append(torch.mean(episode_returns).to(device))
|
mean_episode_return_buf[position].append(torch.mean(episode_returns).to(device))
|
||||||
with lock:
|
with lock:
|
||||||
|
|
Loading…
Reference in New Issue