Skip to content

Commit

Permalink
PLR setup but slow
Browse files: browse the repository at this point in the history
  • Loading branch information
RyanNavillus committed Nov 8, 2024
1 parent f9db936 commit 2aa6ad6
Show file tree
Hide file tree
Showing 2 changed files with 3 additions and 1 deletion.
2 changes: 1 addition & 1 deletion reinforcement_learning/clean_pufferl.py
Original file line number Diff line number Diff line change
Expand Up @@ -313,7 +313,7 @@ def evaluate(data):
next_lstm_state[0][:, env_id],
next_lstm_state[1][:, env_id],
)

print("puffer shape", o.shape)
actions, logprob, value, next_lstm_state = data.policy_pool.forwards(
o.to(data.device), next_lstm_state
)
Expand Down
2 changes: 2 additions & 0 deletions syllabus_wrapper.py
Original file line number Diff line number Diff line change
Expand Up @@ -105,6 +105,8 @@ def _prepare_state(self, state):
new_state.append(np.stack(padded_obs.values()))

state = torch.Tensor(np.stack(new_state)).to(self.device)
print("syllabus shape", state.shape)

return state

def _set_eval_mode(self):
Expand Down

0 comments on commit 2aa6ad6

Please sign in to comment.