(self)
| 69 | return self.resid_dropout(self.w2(self.gelu(self.w1(x)))) |
| 70 | |
def reset_parameters(self):
    """Re-initialise this module by delegating to its ``w1`` and ``w2`` attributes.

    Calls ``reset_parameters()`` on ``self.w1`` first and then on
    ``self.w2``; nothing else on the instance is touched and nothing is
    returned.
    """
    # Look each attribute up right before calling it, keeping the w1 -> w2 order.
    for attr_name in ("w1", "w2"):
        getattr(self, attr_name).reset_parameters()
| 74 | |
| 75 | |
| 76 | class TransformerBlock(nn.Module): |
nothing calls this directly
no test coverage detected