Skip to content

Commit

Permalink
edit to rpe
Browse files Browse the repository at this point in the history
  • Loading branch information
ago109 committed Jul 16, 2024
1 parent c4ed156 commit 9768930
Showing 1 changed file with 6 additions and 3 deletions.
9 changes: 6 additions & 3 deletions ngclearn/components/neurons/graded/rewardErrorCell.py
Original file line number Diff line number Diff line change
Expand Up @@ -76,18 +76,21 @@ def advance_state(self, mu, rpe, n_ep_steps, accum_reward, Ns):

     @staticmethod
     def _evolve(dt, use_online_predictor, ema_window_len, n_ep_steps, mu,
-                accum_reward, rpe):
+                accum_reward, reward, rpe):
+        accum_reward = accum_reward + reward
+        n_ep_steps = n_ep_steps + 1
         if use_online_predictor is False:
             ## total episodic reward signal
             r = accum_reward/n_ep_steps
             mu = (1. - 1./ema_window_len) * mu + (1./ema_window_len) * r
             rpe = r - mu
-        return mu, rpe
+        return mu, rpe, accum_reward

     @resolver(_evolve)
-    def evolve(self, mu, rpe):
+    def evolve(self, mu, rpe, accum_reward):
         self.mu.set(mu)
         self.rpe.set(rpe)
+        self.accum_reward.set(accum_reward)

@staticmethod
def _reset(batch_size, n_units):
Expand Down

0 comments on commit 9768930

Please sign in to comment.