(step)
| 402 | old_params = self.get_pi_params() |
| 403 | |
| 404 | def set_and_eval(step): |
| 405 | params = old_params - alpha * x * step |
| 406 | self.set_pi_params(params) |
| 407 | d_kl = self.kl(states, old_mu, old_log_std) |
| 408 | loss = self.pi_loss(states, actions, adv, logp_old_ph) |
| 409 | return [d_kl, loss] |
| 410 | |
| 411 | # TRPO with backtracking line search, hard KL constraint |
| 412 | for j in range(BACKTRACK_ITERS): |
nothing calls this directly
no test coverage detected