(x:Tensor, start_pos:int|UOp)
# The weights are not parameters of _run: they are picked up implicitly
# (allow_implicit=True) so the GGUF is unpacked on the fly.
@function(precompile=True, allow_implicit=True)
def _run(x:Tensor, start_pos:int|UOp):
  # Attention runs on the attn_norm'd input; its output is added back onto x.
  attn_out = self._attention(self.attn_norm(x), start_pos)
  h = x + attn_out
  # Feed-forward runs on the ffn_norm'd h; its output is added back onto h.
  ffn_out = self._feed_forward(self.ffn_norm(h))
  out = h + ffn_out
  return out.contiguous()
| 137 | return _run(x, start_pos) |
| 138 | |
| 139 | class TransformerBlock(FFNBlock): |
nothing calls this directly
no test coverage detected