Method forward

tensorrt_llm/quantization/layers.py:72–74 · view source on GitHub ↗

(self, x)

Source from the content-addressed store, hash-verified

70	self.axis = axis
71
def forward(self, x):
    """Quantize ``x`` with this layer's stored quantization settings.

    Delegates to ``quantize``, passing the value of the layer's scaling
    factor together with the configured output dtype and axis.

    Args:
        x: The input to quantize.

    Returns:
        Whatever ``quantize`` returns for the given input and settings.
    """
    scale = self.scaling_factor.value
    return quantize(x, scale, self.output_dtype, self.axis)
75
76
77	class QuantizePerToken(Module):

test_quantize_per_tensor · Method · 0.95

test_quantize_per_channel · Method · 0.95

quantize · Function · 0.70

test_quantize_per_tensor · Method · 0.76

test_quantize_per_channel · Method · 0.76