(model, quant_config: QuantConfig)
| 222 | |
| 223 | |
def smooth_quantize(model, quant_config: QuantConfig):
    """Route ``model`` to the plugin or OOTB smooth-quantize implementation.

    The choice depends on whether ``quant_config.quant_algo`` is a member of
    ``W8A8_SQ_PLUGIN_LIST``.

    Args:
        model: The model object forwarded unchanged to the selected helper.
        quant_config: Quantization settings. ``quant_mode`` is checked up
            front and is the only part handed to the plugin helper; the OOTB
            helper receives the whole config object.

    Returns:
        Whatever the selected helper returns.

    Raises:
        AssertionError: If ``quant_config.quant_mode.has_act_and_weight_quant()``
            is falsy (only when assertions are enabled).
    """
    # Precondition check; runs before any dispatch decision is made.
    assert quant_config.quant_mode.has_act_and_weight_quant()

    use_plugin = quant_config.quant_algo in W8A8_SQ_PLUGIN_LIST
    if not use_plugin:
        # OOTB path takes the full config object.
        return smooth_quantize_ootb(model, quant_config)

    # Plugin path only needs the quantization mode.
    return smooth_quantize_plugin(model, quant_config.quant_mode)
| 230 | |
| 231 | |
| 232 | def fp8_quantize(model, quant_config: QuantConfig): |
no test coverage detected