(
self: SelfSAC,
total_timesteps: int,
callback: MaybeCallback = None,
log_interval: int = 4,
tb_log_name: str = "SAC",
reset_num_timesteps: bool = True,
progress_bar: bool = False,
)
| 302 | self.logger.record("train/ent_coef_loss", np.mean(ent_coef_losses)) |
| 303 | |
| 304 | def learn( |
| 305 | self: SelfSAC, |
| 306 | total_timesteps: int, |
| 307 | callback: MaybeCallback = None, |
| 308 | log_interval: int = 4, |
| 309 | tb_log_name: str = "SAC", |
| 310 | reset_num_timesteps: bool = True, |
| 311 | progress_bar: bool = False, |
| 312 | ) -> SelfSAC: |
| 313 | return super().learn( |
| 314 | total_timesteps=total_timesteps, |
| 315 | callback=callback, |
| 316 | log_interval=log_interval, |
| 317 | tb_log_name=tb_log_name, |
| 318 | reset_num_timesteps=reset_num_timesteps, |
| 319 | progress_bar=progress_bar, |
| 320 | ) |
| 321 | |
| 322 | def _excluded_save_params(self) -> list[str]: |
| 323 | return super()._excluded_save_params() + ["actor", "critic", "critic_target"] # noqa: RUF005 |
no outgoing calls