(self, obs)
| 117 | self.real_total_rewards = [] |
| 118 | |
def update_state(self, obs):
    """Push a new observation into the stacked-frame buffer.

    Frame stacking is done here instead of through the FrameStack wrapper
    to reduce IPC overhead.

    ``self.state`` is rotated by ``self.nc`` positions toward the start of
    axis 3, and the trailing ``self.nc`` entries along that axis are then
    overwritten with ``obs``.

    NOTE(review): presumably axis 3 is the channel axis and ``self.nc`` is
    the per-frame channel count -- confirm against the constructor.
    """
    step = self.nc
    # Rebind self.state to the rotated array before writing, so the oldest
    # entries (which wrapped around to the end) are the ones replaced.
    self.state = np.roll(self.state, -step, axis=3)
    tail = (slice(None), slice(None), slice(None), slice(-step, None))
    self.state[tail] = obs
| 123 | |
| 124 | def run(self): |
| 125 | mb_states, mb_rewards, mb_actions, mb_values, mb_dones = [], [], [], [], [] |