Hard-copy update for initializing target networks: every trainable weight of `net` is assigned to the corresponding weight of `target_net`.
(self, net, target_net)
| 259 | self.alpha_optimizer = tf.optimizers.Adam(ALPHA_LR) |
| 260 | |
def target_ini(self, net, target_net):
    """Initialize a target network as a direct copy of its source network.

    The trainable weights of ``target_net`` and ``net`` are paired by
    position, and each source weight is written into its target
    counterpart through the target weight's ``assign`` method.  Pairing
    stops at the shorter of the two weight lists.

    Args:
        net: network whose ``trainable_weights`` supply the values.
        target_net: network whose ``trainable_weights`` are overwritten
            in place.

    Returns:
        The same ``target_net`` object that was passed in.
    """
    # Read the destination list first, then the source list, so attribute
    # access happens in the same order as the paired iteration below.
    destination_weights = target_net.trainable_weights
    source_weights = net.trainable_weights

    for destination, source in zip(destination_weights, source_weights):
        destination.assign(source)

    return target_net
| 266 | |
| 267 | def target_soft_update(self, net, target_net, soft_tau): |
| 268 | """ soft update the target net with Polyak averaging """ |