(self, hidden_states, cu_seqlens=None, indexes=None, inference_params=None, max_seqlen=None)
| 161 | normal_(std=0.006 if "fc1" in name else 0.0015)(param.data) |
| 162 | |
def forward(self, hidden_states, cu_seqlens=None, indexes=None, inference_params=None, max_seqlen=None):
    """Dispatch to ``self._forward``, optionally via ``activation_checkpoint``.

    The same five arguments are handed on unchanged on both paths.

    Args:
        hidden_states: Forwarded as the first argument of ``self._forward``.
        cu_seqlens: Forwarded unchanged; defaults to ``None``.
        indexes: Forwarded unchanged; defaults to ``None``.
        inference_params: Forwarded unchanged; defaults to ``None``.
        max_seqlen: Forwarded unchanged; defaults to ``None``.

    Returns:
        Whatever ``self._forward`` returns when called directly, or whatever
        ``activation_checkpoint`` returns when the checkpointed path is taken.
    """
    layer_args = (hidden_states, cu_seqlens, indexes, inference_params, max_seqlen)

    # Direct call unless checkpointing is switched on AND the module is in
    # training mode.
    if not (self.checkpoint and self.training):
        return self._forward(*layer_args)

    # NOTE(review): the literal ``False`` is passed through as the second
    # positional argument; presumably a reentrancy flag - confirm against
    # the signature of ``activation_checkpoint``.
    return activation_checkpoint(self._forward, False, *layer_args)
| 170 | |
| 171 | def _forward(self, hidden_states=None, cu_seqlens=None, indexes=None, inference_params=None, max_seqlen=None): |
| 172 | r"""Pass the input through the encoder layer. |
nothing calls this directly
no test coverage detected