Method _get_quant_cfg

tensorrt_llm/models/modeling_utils.py:199–207 · view source on GitHub ↗

(self, module_name=None)

Source from the content-addressed store, hash-verified

197	return False
198
def _get_quant_cfg(self, module_name=None):
    """Return the quantization config that applies to ``module_name``.

    Each entry of ``self.exclude_modules`` is compared against
    ``module_name`` in one of two ways:

    * exact equality, or
    * prefix match, when the entry ends with ``'*'`` (the trailing
      ``'*'`` is stripped and the remainder must be a prefix of
      ``module_name``).

    Args:
        module_name: Name of the module being looked up. May be ``None``
            (the default), in which case only the equality comparison is
            attempted and wildcard entries are never considered a match.

    Returns:
        A fresh ``LayerQuantConfig(quant_algo=None, quantized_layers={})``
        when the module matches an exclusion entry (presumably meaning
        "leave this module unquantized" -- confirm against callers);
        otherwise ``self``.
    """
    if self.exclude_modules is None:
        return self

    for pattern in self.exclude_modules:
        exact_match = pattern == module_name
        # Guard the prefix test: module_name defaults to None, and calling
        # None.startswith(...) would raise AttributeError as soon as any
        # wildcard entry is present in exclude_modules.
        prefix_match = (module_name is not None and pattern.endswith('*')
                        and module_name.startswith(pattern[:-1]))
        if exact_match or prefix_match:
            return LayerQuantConfig(quant_algo=None, quantized_layers={})

    return self
208
209	def _get_modelopt_qformat(self):
210	algo_to_modelopt_map = {

quantize — Function · 0.45

_get_quant_cfg — Method · 0.45

fuse_gate_mlp — Function · 0.45

unfuse_qkv_gemm — Function · 0.45

preprocess_weights — Function · 0.45

LayerQuantConfig — Class · 0.85

no test coverage detected